feat: init Learning class and add drop_empty_price function

Add Python package ecosystem to Dependabot config
Configure Dependabot for Python package updates.
2026-03-28 18:03:47 +00:00 · 2026-03-28 15:51:46 +01:00 · 2026-03-27 22:11:53 +01:00 · 2026-03-27 22:06:36 +01:00 · 2026-03-27 22:06:06 +01:00
8 changed files with 78 additions and 39 deletions
--- a/.github/dependabot.yml
+++ b/.github/dependabot.yml
@@ -0,0 +1,18 @@
 # To get started with Dependabot version updates, you'll need to specify which
 # package ecosystems to update and where the package manifests are located.
 # Please see the documentation for all configuration options:
 # https://docs.github.com/code-security/dependabot/dependabot-version-updates/configuration-options-for-the-dependabot.yml-file
 version: 2
 updates:
  - package-ecosystem: "pip"
    directory: "/"
    schedule:
      interval: "weekly"
      day: "saturday"
    open-pull-requests-limit: 5
    groups:
      python-dependencies:
        patterns:
          - "*"
--- a/.github/workflows/python-app.yml
+++ b/.github/workflows/python-app.yml
@@ -19,15 +19,15 @@ jobs:
    steps:
      - uses: actions/checkout@v4
-      - name: Set up Python 3.10
+      - name: Set up Python 3.x
        uses: actions/setup-python@v4
        with:
-          python-version: "3.10"
+          python-version: "3.x"
      - name: install dependencies
        run: |
          python -m pip install --upgrade pip
-          pip install ".[test,doc]"
+          pip install ".[test]"
      - name: Lint with flake8
        run: |
--- a/.github/workflows/static.yml
+++ b/.github/workflows/static.yml
@@ -32,15 +32,14 @@ jobs:
      - name: Checkout
        uses: actions/checkout@v4
-      - name: Set up Python 3.10
+      - name: Set up Python 3.x
        uses: actions/setup-python@v5
        with:
-          python-version: '3.10'
+          python-version: '3.x'
      - name: Install dependencies
        run: |
          python -m pip install --upgrade pip
          # Install the project in editable mode with the doc extras
          pip install -e ".[doc]"
      - name: Setup Pages
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -6,8 +6,13 @@ dependencies = [
    "beautifulsoup4==4.14.3",
    "pandas==2.3.3",
    "tqdm==4.67.3",
    "scikit-learn==1.7.2"
 ]
 [tool.pytest.ini_options]
 pythonpath = "src"
 testpaths = ["tests"]
 [project.optional-dependencies]
 test = ["pytest==8.4.2", "requests-mock==1.12.1", "flake8==7.3.0"]
 doc = ["mkdocs<2.0.0", "mkdocs-material==9.6.23", "mkdocstrings[python]"]
--- a/src/cleaning.py
+++ b/src/cleaning.py
@@ -92,18 +92,24 @@ class Cleaning:
        self._vins = self._vins.join(appellation_dummies)
        return self
    def drop_empty_price(self) -> "Cleaning":
        """Remove the rows whose "Prix" value is missing.

        Returns:
            The instance itself, so that calls can be chained.
        """
        priced_rows = self._vins.dropna(subset=["Prix"])
        self._vins = priced_rows
        return self
 def main() -> None:
    if len(argv) != 2:
        raise ValueError(f"Usage: {argv[0]} <filename.csv>")
    filename = argv[1]
-    cleaning: Cleaning = Cleaning(filename)
+    cleaning: Cleaning = (
-    cleaning.drop_empty_appellation()   \
+        Cleaning(filename)
-        .fill_missing_scores()          \
+        .drop_empty_appellation()
-        .encode_appellation()           \
+        .fill_missing_scores()
-        .getVins()                      \
+        .encode_appellation()
-        .to_csv("clean.csv", index=False)
+        .drop_empty_price()
    )
    cleaning.getVins().to_csv("clean.csv", index=False)
 if __name__ == "__main__":
--- a/src/learning.py
+++ b/src/learning.py
@@ -0,0 +1,31 @@
 #!/usr/bin/env python3
 from typing import Any, Callable
 from pandas import DataFrame
 from sklearn.linear_model import LinearRegression
 from sklearn.model_selection import train_test_split
 from sklearn.pipeline import make_pipeline
 class Learning:
    """Hold a train/test split of a dataset and evaluate estimators on it.

    ``__init__`` stores the features as ``X``, the target column as ``y`` and
    the split subsets as ``X_train``, ``X_test``, ``y_train`` and ``y_test``.
    """

    def __init__(self, vins: DataFrame, target: str) -> None:
        """Separate features from target, then split into train/test sets.

        Args:
            vins: Dataset holding the feature columns and the target column.
            target: Name of the column to predict.
        """
        self.X = vins.drop(target, axis=1)
        self.y = vins[target]
        # 25% of the rows are held out; the fixed seed keeps the split
        # identical from one run to the next.
        self.X_train, self.X_test, self.y_train, self.y_test = train_test_split(
            self.X, self.y, test_size=0.25, random_state=49
        )

    def evaluate(
        self,
        estimator: Any,
        pretreatment: Any = None,
        fn_score: Callable[[Any, Any, Any], Any] = (
            lambda m, xt, yt: m.score(xt, yt)
        ),
    ) -> tuple[Any, Any]:
        """Fit ``estimator`` on the training set and score it on the test set.

        Args:
            estimator: Object exposing ``fit`` and ``predict`` (and ``score``
                when the default ``fn_score`` is used).
            pretreatment: Optional preprocessing step chained before the
                estimator with ``make_pipeline``; ``None`` means no
                preprocessing.
            fn_score: Callable receiving the fitted model, ``X_test`` and
                ``y_test`` and returning the score. Defaults to the model's
                own ``score`` method.

        Returns:
            A ``(score, prediction)`` tuple, where ``prediction`` is the
            output of ``predict`` on ``X_test``.
        """
        # Compare against None explicitly: a valid preprocessing object may
        # be falsy (e.g. it defines __len__) and must not be silently skipped.
        if pretreatment is None:
            model = estimator
        else:
            model = make_pipeline(pretreatment, estimator)
        model.fit(self.X_train, self.y_train)
        score = fn_score(model, self.X_test, self.y_test)
        prediction = model.predict(self.X_test)
        return score, prediction
--- a/src/scraper.py
+++ b/src/scraper.py
@@ -377,18 +377,10 @@ class Scraper:
        try:
            data: dict[str, object] = self.getjsondata(subdir).getdata()
            # The site changed the way it stores its data.
            #  
            # for element in ["initialReduxState", "categ", "content"]:
            #     data = cast(dict[str, object], data.get(element))
            #     print(data)
            products: list[dict[str, Any]] = cast(
                list[dict[str, Any]], data.get("products")
            )
            print(products)
            return products
        except (JSONDecodeError, HTTPError):
--- a/tests/test_scraper.py
+++ b/tests/test_scraper.py
@@ -185,17 +185,11 @@ def mock_site():
                        {dumps({
                            "props": {
                                "pageProps": {
-                                    "initialReduxState": {
+                                    "products": [
-                                        "categ": {
+                                        {"seoKeyword": "/nino-negri-5-stelle-sfursat-2022.html",},
-                                            "content": {
+                                        {"seoKeyword": "/poubelle",},
-                                                "products": [
+                                        {"seoKeyword": "/",}
-                                                    {"seoKeyword": "/nino-negri-5-stelle-sfursat-2022.html",},
+                                    ]
                                                    {"seoKeyword": "/poubelle",},
                                                    {"seoKeyword": "/",}
                                                ]
                                            }
                                        }
                                    }
                                }
                            }
                        }
@@ -213,14 +207,8 @@ def mock_site():
                        {dumps({
                            "props": {
                                "pageProps": {
-                                    "initialReduxState": {
+                                    "products": [
-                                        "categ": {
+                                    ]
                                            "content": {
                                                "products": [
                                                ]
                                            }
                                        }
                                    }
                                }
                            }
                        }
Author	SHA1	Message	Date
Loïc GUEZO	106877a073	feat: init Learning class and add drop_empty_price function	2026-03-28 15:51:46 +01:00
Loïc GUEZO	416cfcbf8b	Add Python package ecosystem to Dependabot config Configure Dependabot for Python package updates.	2026-03-27 22:11:53 +01:00
Loïc GUEZO	32c5310e37	fix: mettre à jour les tests pytest	2026-03-27 22:06:36 +01:00
Loïc GUEZO	9dfc7457a0	fix(scraper.py): retirer commentaire code et print	2026-03-27 22:06:06 +01:00