Skip to content

Commit ddd0a8c

Browse files
authored
Merge pull request #41 from obeone/reorganize-project
Reorganize project
2 parents 312b091 + d0d4acf commit ddd0a8c

8 files changed

Lines changed: 14 additions & 12 deletions

File tree

.dockerignore

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7,3 +7,6 @@
77
/output
88
__pycache__
99
.git
10+
/pytest_cahe
11+
/tests
12+
/.github

main.py

Lines changed: 5 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1,17 +1,16 @@
1-
from turtle import title
2-
import log_setup
1+
import src.log_setup as log_setup
32
import os
43
import argparse
5-
import utils
4+
import src.utils as utils
65
import sys
76

87
# Set up logging from the LOG_LEVEL environment variable (default: WARN) before importing other modules.
98
log_level = os.getenv("LOG_LEVEL", "WARN")
109
log_setup.setup_logging(log_level)
1110

12-
from database_manager import DatabaseManager
13-
from export_manager import ExportManager
14-
from scraper import Scraper
11+
from src.database_manager import DatabaseManager
12+
from src.export_manager import ExportManager
13+
from src.scraper import Scraper
1514

1615
logger = log_setup.get_logger()
1716
logger.name = "main"

src/__init__.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
# Package initialization file
export_manager.py renamed to src/export_manager.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
import json
2-
from database_manager import DatabaseManager
3-
import log_setup
2+
from . import log_setup
3+
from .database_manager import DatabaseManager
44
import os
55
from tqdm import tqdm
66

File renamed without changes.

scraper.py renamed to src/scraper.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -2,11 +2,11 @@
22
import requests
33
from bs4 import BeautifulSoup
44
from urllib.parse import urljoin, urldefrag
5-
import log_setup
5+
from . import log_setup
66
import trafilatura
77
import mdformat
88
import json
9-
from database_manager import DatabaseManager
9+
from .database_manager import DatabaseManager
1010
from tqdm import tqdm
1111
import coloredlogs
1212
import time

utils.py renamed to src/utils.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
import log_setup # Add log messages
1+
from . import log_setup # Add log messages
22
from urllib.parse import urlparse, urlunparse
33

44
logger = log_setup.get_logger()
@@ -99,4 +99,3 @@ def deduplicate_list(input_list):
9999
seen = set()
100100
deduplicated_list = [x for x in input_list if not (x in seen or seen.add(x))]
101101
return deduplicated_list
102-

0 commit comments

Comments
 (0)