gabykim commited on
Commit
16bbb61
·
1 Parent(s): c20abe2

code provider classes implemented

Browse files
src/know_lang_bot/parser/providers/filesystem.py ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from pathlib import Path
2
+ from typing import Generator
3
+ from know_lang_bot.config import AppConfig
4
+ from know_lang_bot.parser.base.provider import CodeProvider
5
+ import os
6
+
7
+ class FilesystemProvider(CodeProvider):
8
+ """Provides code files from a filesystem directory"""
9
+ def __init__(self, directory: Path, config: AppConfig):
10
+ self.directory = directory
11
+ self.config = config
12
+
13
+ def get_files(self) -> Generator[Path, None, None]:
14
+ for dirpath, _, filenames in os.walk(self.directory):
15
+ dir_path = Path(dirpath)
16
+ if not self.config.parser.path_patterns.should_process_path(dir_path):
17
+ continue
18
+
19
+ for filename in filenames:
20
+ file_path = dir_path / filename
21
+ if self.config.parser.path_patterns.should_process_path(file_path):
22
+ yield file_path
src/know_lang_bot/parser/providers/git.py ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from pathlib import Path
2
+ from typing import Generator
3
+ from git import Repo
4
+ from know_lang_bot.config import AppConfig
5
+ from know_lang_bot.parser.base.provider import CodeProvider
6
+ import os
7
+
8
+
9
+ class GitProvider(CodeProvider):
10
+ """Provides code files from a Git repository"""
11
+ def __init__(self, repo_path: Path, config: AppConfig):
12
+ self.repo_path = repo_path
13
+ self.config = config
14
+ self._validate_repo()
15
+
16
+ def _validate_repo(self):
17
+ """Validate that the repository exists and is not bare"""
18
+ if not (self.repo_path / '.git').exists():
19
+ raise ValueError(f"No git repository found at {self.repo_path}")
20
+ repo = Repo(self.repo_path)
21
+ if repo.bare:
22
+ raise ValueError(f"Repository {self.repo_path} is bare")
23
+
24
+ def get_files(self) -> Generator[Path, None, None]:
25
+ repo = Repo(self.repo_path)
26
+ for dirpath, _, filenames in os.walk(repo.working_tree_dir):
27
+ dir_path = Path(dirpath)
28
+ if repo.ignored(dir_path) or not self.config.parser.path_patterns.should_process_path(dir_path):
29
+ continue
30
+
31
+ for filename in filenames:
32
+ file_path = dir_path / filename
33
+ if (not repo.ignored(file_path) and
34
+ self.config.parser.path_patterns.should_process_path(file_path)):
35
+ yield file_path