dataforgoodfr
diff --git a/browser-extension/README.md b/browser-extension/README.md
Lines changed: 5 additions & 11 deletions
diff --git a/browser-extension/entrypoints/background/index.ts b/browser-extension/entrypoints/background/index.ts
Lines changed: 1 addition & 1 deletion
diff --git a/browser-extension/entrypoints/background/scraping/instagram/instagram-scraper.ts b/browser-extension/entrypoints/background/scraping/instagram/instagram-scraper.ts
Lines changed: 127 additions & 127 deletions
diff --git a/browser-extension/entrypoints/background/scraping/puppeteer/ariaLabel.ts b/browser-extension/entrypoints/background/scraping/puppeteer/ariaLabel.ts
Lines changed: 1 addition & 1 deletion
diff --git a/browser-extension/entrypoints/background/scraping/puppeteer/selectOrThrow.ts b/browser-extension/entrypoints/background/scraping/puppeteer/selectOrThrow.ts
Lines changed: 1 addition & 1 deletion
diff --git a/browser-extension/entrypoints/background/scraping/scrap-tab.ts b/browser-extension/entrypoints/background/scraping/scrap-tab.ts
Lines changed: 1 addition & 1 deletion
@@ -1,25 +1,19 @@
 # Extension Navigateur Balance Tes Haters
 
-
 Cette extension permet de capturer les commentaires depuis des publications de réseaux sociaux.
 
-
-
 # Contributing
 
 Cette extension utilise [wxt](https://wxt.dev/) + React
 
 ## Installation
 
-* Installer pnpm
-* `pnpm install` dans le repertoire extension
+- Installer pnpm
+- `pnpm install` dans le répertoire extension
 
 ## Mode dev (avec chrome)
 
-* Lancer `pnpm dev`
-* Charger le répertoire .output/chrome-mv3-dev comme extension non empaqueté (see https://developer.chrome.com/docs/extensions/get-started/tutorial/hello-world#load-unpacked)
-
-
-A partir de là la plupart des changements sont propagé automatiquement dans l'extension navigateur sans besoin de rafraichir manuellement l'extension. 
-
+- Lancer `pnpm dev`
+- Charger le répertoire .output/chrome-mv3-dev comme extension non empaquetée (voir https://developer.chrome.com/docs/extensions/get-started/tutorial/hello-world#load-unpacked)
 
+À partir de là, la plupart des changements sont propagés automatiquement dans l'extension navigateur, sans besoin de rafraîchir manuellement l'extension.
@@ -8,7 +8,7 @@ export default defineBackground(() => {
 
   async function handleMessages(
     message: Message,
-    sender: Browser.runtime.MessageSender
+    sender: Browser.runtime.MessageSender,
   ) {
     console.debug("Message received:", message, sender);
 
 
@@ -1,156 +1,156 @@
 import {
-    ElementHandle,
-    Page,
+  ElementHandle,
+  Page,
 } from "puppeteer-core/lib/esm/puppeteer/puppeteer-core-browser.js";
 import { PuppeteerBaseScraper } from "../puppeteer/puppeteer-base-scraper";
 import {
-    type Author,
-    type Post,
-    type Comment,
+  type Author,
+  type Post,
+  type Comment,
 } from "../../../shared/model/post";
 import { parseSocialNetworkUrl } from "@/entrypoints/shared/social-network-url";
 import { currentIsoDate } from "../utils/current-iso-date";
 
 //TODO: gérer le scroll et le chargement des commentaires
 //TODO: gérer le scraping des réponses aux commentaires
 export class InstagramScraper extends PuppeteerBaseScraper {
-    private INSTAGRAM_URL = "https://www.instagram.com/";
+  private INSTAGRAM_URL = "https://www.instagram.com/";
 
-    extractPostId(url: string): string {
-        const parsed = parseSocialNetworkUrl(url);
-        if (!parsed) {
-            throw new Error("Unexpected");
-        }
-        return parsed.postId;
+  extractPostId(url: string): string {
+    const parsed = parseSocialNetworkUrl(url);
+    if (!parsed) {
+      throw new Error("Unexpected");
     }
+    return parsed.postId;
+  }
 
-    async doScrapTab(tab: Browser.tabs.Tab, page: Page): Promise<Post> {
-        // //main/div/div/div
-        const cadre_publication = (await page.$("::-p-xpath(//main/div/div/div)"))!;
-        const colonne_commentaires = (await cadre_publication.$(
-            "::-p-xpath(./div[2]/div)"
-        ))!;
+  async doScrapTab(tab: Browser.tabs.Tab, page: Page): Promise<Post> {
+    // //main/div/div/div
+    const cadre_publication = (await page.$("::-p-xpath(//main/div/div/div)"))!;
+    const colonne_commentaires = (await cadre_publication.$(
+      "::-p-xpath(./div[2]/div)",
+    ))!;
 
-        // //main/div/div/div/./div[2]/div/./div[2]
-        const zone_defilable = (await colonne_commentaires.$(
-            "::-p-xpath(./div[2])"
-        ))!;
+    // //main/div/div/div/./div[2]/div/./div[2]
+    const zone_defilable = (await colonne_commentaires.$(
+      "::-p-xpath(./div[2])",
+    ))!;
 
-        // //main/div/div/div/./div[2]/div/./div[2]/./div/div[1]/div/div[2]/div/span
-        const publication = (await zone_defilable.$(
-            "::-p-xpath(./div/div[1]/div/div[2]/div/span)"
-        ))!;
+    // //main/div/div/div/./div[2]/div/./div[2]/./div/div[1]/div/div[2]/div/span
+    const publication = (await zone_defilable.$(
+      "::-p-xpath(./div/div[1]/div/div[2]/div/span)",
+    ))!;
 
-        // //main/div/div/div/./div[2]/div/./div[2]/./div/div[1]/div/div[2]/div/span/./div/div
-        const entete_publication = (await publication.$("::-p-xpath(./div/div)"))!;
+    // //main/div/div/div/./div[2]/div/./div[2]/./div/div[1]/div/div[2]/div/span/./div/div
+    const entete_publication = (await publication.$("::-p-xpath(./div/div)"))!;
 
-        // //main/div/div/div/./div[2]/div/./div[2]/./div/div[1]/div/div[2]/div/span/./span[1]
-        const auteur = await this.get_auteur_from_span(
-            (await entete_publication.$("::-p-xpath(./span[1])"))!
-        );
+    // //main/div/div/div/./div[2]/div/./div[2]/./div/div[1]/div/div[2]/div/span/./span[1]
+    const auteur = await this.get_auteur_from_span(
+      (await entete_publication.$("::-p-xpath(./span[1])"))!,
+    );
 
-        // //main/div/div/div/./div[2]/div/./div[2]/./div/div[1]/div/div[2]/div/span/./div/div/.//time
-        const date_publication = (await entete_publication.$eval(
-            "::-p-xpath(.//time)",
-            (node) => node.getAttribute("datetime")
-        ))!;
+    // //main/div/div/div/./div[2]/div/./div[2]/./div/div[1]/div/div[2]/div/span/./div/div/.//time
+    const date_publication = (await entete_publication.$eval(
+      "::-p-xpath(.//time)",
+      (node) => node.getAttribute("datetime"),
+    ))!;
 
-        // //main/div/div/div/./div[2]/div/./div[2]/./div/div[1]/div/div[2]/div/span/./div/span
-        const texte_publication = (await publication.$eval(
-            "::-p-xpath(./div/span)",
-            (node) => node.textContent
-        ))!;
+    // //main/div/div/div/./div[2]/div/./div[2]/./div/div[1]/div/div[2]/div/span/./div/span
+    const texte_publication = (await publication.$eval(
+      "::-p-xpath(./div/span)",
+      (node) => node.textContent,
+    ))!;
 
-        // //main/div/div/div/./div[2]/div/./div[2]/./div/div[3]
-        const liste_commentaires = (await zone_defilable.$(
-            "::-p-xpath(./div/div[3])"
-        ))!;
-        //const commentaires = (await liste_commentaires.$$("::-p-xpath(./div)")).map(e => this.extract_commentaire(e))!;
-        const commentaires: Comment[] = [];
-        let div_commentaire = await liste_commentaires.$("::-p-xpath(./div)");
-        while (div_commentaire) {
-            await div_commentaire.scrollIntoView();
-            commentaires.push(await this.extract_commentaire(div_commentaire));
-            await this.sleep(500);
-            // gérer un peu mieux le scroll et le temps de chargement des pages de
-            // commentaires
-            div_commentaire = await div_commentaire.$(
-                "::-p-xpath(./following-sibling::*)"
-            );
-            // gérer ici le ce scraping des réponses aux commentaires
-        }
-
-        return {
-            postId: this.extractPostId(tab.url!),
-            socialNetwork: "INSTAGRAM",
-            url: tab.url!,
-            author: auteur,
-            scrapedAt: new Date().toISOString(),
-            publishedAt: new Date(date_publication).toISOString(),
-            textContent: texte_publication,
-            comments: await Promise.all(commentaires),
-        };
+    // //main/div/div/div/./div[2]/div/./div[2]/./div/div[3]
+    const liste_commentaires = (await zone_defilable.$(
+      "::-p-xpath(./div/div[3])",
+    ))!;
+    //const commentaires = (await liste_commentaires.$$("::-p-xpath(./div)")).map(e => this.extract_commentaire(e))!;
+    const commentaires: Comment[] = [];
+    let div_commentaire = await liste_commentaires.$("::-p-xpath(./div)");
+    while (div_commentaire) {
+      await div_commentaire.scrollIntoView();
+      commentaires.push(await this.extract_commentaire(div_commentaire));
+      await this.sleep(500);
+      // gérer un peu mieux le scroll et le temps de chargement des pages de
+      // commentaires
+      div_commentaire = await div_commentaire.$(
+        "::-p-xpath(./following-sibling::*)",
+      );
+      // gérer ici le ce scraping des réponses aux commentaires
     }
 
-    private async get_auteur_from_span(
-        span_element: ElementHandle<Element>
-    ): Promise<Author> {
-        const auteur_elem = (await span_element.$("::-p-xpath(.//a)"))!;
-        const auteur_href = (await auteur_elem.$eval("::-p-xpath(.)", (node) =>
-            node.getAttribute("href")
-        ))!;
-        const auteur_name = (await auteur_elem.$eval(
-            "::-p-xpath(.//span)",
-            (node) => node.textContent
-        ))!;
-        return {
-            name: auteur_name,
-            accountHref: this.urlJoin(this.INSTAGRAM_URL, auteur_href),
-        };
-    }
+    return {
+      postId: this.extractPostId(tab.url!),
+      socialNetwork: "INSTAGRAM",
+      url: tab.url!,
+      author: auteur,
+      scrapedAt: new Date().toISOString(),
+      publishedAt: new Date(date_publication).toISOString(),
+      textContent: texte_publication,
+      comments: await Promise.all(commentaires),
+    };
+  }
 
-    private async extract_commentaire(
-        comment_element: ElementHandle<Element>
-    ): Promise<Comment> {
-        let base = (await comment_element.$(
-            "::-p-xpath(./div/div/div[2]/div/div)"
-        ))!;
-        base = (await base.$("::-p-xpath(.//span[1]/../..)"))!;
-        const base_0 = (await base.$("::-p-xpath(div[1])"))!;
-        const base_1 = (await base.$("::-p-xpath(div[2])"))!;
-        const auteur = await this.get_auteur_from_span(base_0);
-        let date_commentaire: Date | undefined = undefined;
-        try {
-            const date_str = (await base.$eval("::-p-xpath(.//time)", (node) =>
-                node.getAttribute("datetime")
-            ))!;
-            date_commentaire = date_str ? new Date(date_str) : undefined;
-        } catch (_) {
-            date_commentaire = undefined;
-        }
+  private async get_auteur_from_span(
+    span_element: ElementHandle<Element>,
+  ): Promise<Author> {
+    const auteur_elem = (await span_element.$("::-p-xpath(.//a)"))!;
+    const auteur_href = (await auteur_elem.$eval("::-p-xpath(.)", (node) =>
+      node.getAttribute("href"),
+    ))!;
+    const auteur_name = (await auteur_elem.$eval(
+      "::-p-xpath(.//span)",
+      (node) => node.textContent,
+    ))!;
+    return {
+      name: auteur_name,
+      accountHref: this.urlJoin(this.INSTAGRAM_URL, auteur_href),
+    };
+  }
 
-        const screenshot = await comment_element.screenshot({ encoding: "base64" });
-        const screenshotDate = currentIsoDate();
-        return {
-            author: auteur,
-            textContent: await base_1.$eval(
-                "::-p-xpath(.)",
-                (node) => node.textContent!
-            )!,
-            publishedAt: date_commentaire?.toISOString(),
-            screenshotData: screenshot,
-            scrapedAt: screenshotDate,
-            replies: [],
-            nbLikes: 0    // Voir https://github.com/dataforgoodfr/14_BalanceTesHaters/issues/4
-        };
+  private async extract_commentaire(
+    comment_element: ElementHandle<Element>,
+  ): Promise<Comment> {
+    let base = (await comment_element.$(
+      "::-p-xpath(./div/div/div[2]/div/div)",
+    ))!;
+    base = (await base.$("::-p-xpath(.//span[1]/../..)"))!;
+    const base_0 = (await base.$("::-p-xpath(div[1])"))!;
+    const base_1 = (await base.$("::-p-xpath(div[2])"))!;
+    const auteur = await this.get_auteur_from_span(base_0);
+    let date_commentaire: Date | undefined = undefined;
+    try {
+      const date_str = (await base.$eval("::-p-xpath(.//time)", (node) =>
+        node.getAttribute("datetime"),
+      ))!;
+      date_commentaire = date_str ? new Date(date_str) : undefined;
+    } catch (_) {
+      date_commentaire = undefined;
     }
 
-    private urlJoin(base: string, relative: string): string {
-        const baseWithoutTrailingSlash = base.replace(/\/+$/, "");
-        if (relative.startsWith("/")) {
-            return baseWithoutTrailingSlash + relative;
-        } else {
-            return baseWithoutTrailingSlash + "/" + relative;
-        }
+    const screenshot = await comment_element.screenshot({ encoding: "base64" });
+    const screenshotDate = currentIsoDate();
+    return {
+      author: auteur,
+      textContent: await base_1.$eval(
+        "::-p-xpath(.)",
+        (node) => node.textContent!,
+      )!,
+      publishedAt: date_commentaire?.toISOString(),
+      screenshotData: screenshot,
+      scrapedAt: screenshotDate,
+      replies: [],
+      nbLikes: 0, // Voir https://github.com/dataforgoodfr/14_BalanceTesHaters/issues/4
+    };
+  }
+
+  private urlJoin(base: string, relative: string): string {
+    const baseWithoutTrailingSlash = base.replace(/\/+$/, "");
+    if (relative.startsWith("/")) {
+      return baseWithoutTrailingSlash + relative;
+    } else {
+      return baseWithoutTrailingSlash + "/" + relative;
     }
+  }
 }
@@ -1,7 +1,7 @@
 import { ElementHandle } from "puppeteer-core/lib/esm/puppeteer/puppeteer-core-browser.js";
 
 export async function ariaLabel(
-  element: ElementHandle
+  element: ElementHandle,
 ): Promise<string | null> {
   return await element.evaluate((e) => (e as HTMLElement).ariaLabel);
 }
@@ -3,7 +3,7 @@ import { innerHtml } from "./innerHtml";
 
 export async function selectOrThrow(
   container: ElementHandle,
-  selector: string
+  selector: string,
 ): Promise<ElementHandle> {
   const selectedElement = await container.$(selector)!;
 
 
@@ -3,7 +3,7 @@ import { Post } from "../../shared/model/post";
 import { createScraper } from "./create-scraper";
 
 export async function scrapTab(
-  tab: globalThis.Browser.tabs.Tab
+  tab: globalThis.Browser.tabs.Tab,
 ): Promise<Post> {
   if (tab.url === undefined) {
     throw new Error("Url of tab is undefined");
Original file line number	Diff line number	Diff line change
`@@ -1,7 +1,7 @@`
`1`	`1`	`import { ElementHandle } from "puppeteer-core/lib/esm/puppeteer/puppeteer-core-browser.js";`
`2`	`2`
`3`	`3`	`export async function ariaLabel(`
`4`		`- element: ElementHandle`
	`4`	`+ element: ElementHandle,`
`5`	`5`	`): Promise<string \| null> {`
`6`	`6`	`return await element.evaluate((e) => (e as HTMLElement).ariaLabel);`
`7`	`7`	`}`