Spaces:
Running
Running
fix SET 26 CRs not found
Browse files
- classes.py +15 -8
- requirements.txt +2 -1
classes.py
CHANGED
|
@@ -48,21 +48,28 @@ class ETSIDocFinder:
|
|
| 48 |
|
| 49 |
def search_document(self, doc_id: str):
|
| 50 |
original = doc_id
|
| 51 |
-
|
| 52 |
main_tsg, workgroup, doc = self.get_workgroup(doc_id)
|
| 53 |
urls = []
|
| 54 |
if main_tsg:
|
| 55 |
wg_url = self.find_workgroup_url(main_tsg, workgroup)
|
| 56 |
print(wg_url)
|
| 57 |
if wg_url:
|
| 58 |
-
|
| 59 |
-
print(
|
| 60 |
-
for
|
| 61 |
-
if doc in
|
| 62 |
-
|
| 63 |
-
doc_url = f"{wg_url}/{f}"
|
| 64 |
urls.append(doc_url)
|
| 65 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 66 |
|
| 67 |
class ETSISpecFinder:
|
| 68 |
def __init__(self):
|
|
|
|
| 48 |
|
| 49 |
def search_document(self, doc_id: str):
|
| 50 |
original = doc_id
|
| 51 |
+
|
| 52 |
main_tsg, workgroup, doc = self.get_workgroup(doc_id)
|
| 53 |
urls = []
|
| 54 |
if main_tsg:
|
| 55 |
wg_url = self.find_workgroup_url(main_tsg, workgroup)
|
| 56 |
print(wg_url)
|
| 57 |
if wg_url:
|
| 58 |
+
entries = self.get_docs_from_url(wg_url)
|
| 59 |
+
print(entries)
|
| 60 |
+
for entry in entries:
|
| 61 |
+
if doc in entry.lower() or original in entry:
|
| 62 |
+
doc_url = f"{wg_url}/{entry}"
|
|
|
|
| 63 |
urls.append(doc_url)
|
| 64 |
+
elif "." not in entry.rstrip("/"):
|
| 65 |
+
# looks like a subdirectory — go one level deeper
|
| 66 |
+
sub_url = f"{wg_url}/{entry}"
|
| 67 |
+
files = self.get_docs_from_url(sub_url)
|
| 68 |
+
for f in files:
|
| 69 |
+
if doc in f.lower() or original in f:
|
| 70 |
+
print(f)
|
| 71 |
+
urls.append(f"{sub_url}/{f}")
|
| 72 |
+
return urls[0] if len(urls) == 1 else urls[-1] if len(urls) > 1 else f"Document {doc_id} not found"
|
| 73 |
|
| 74 |
class ETSISpecFinder:
|
| 75 |
def __init__(self):
|
requirements.txt
CHANGED
|
@@ -11,4 +11,5 @@ scikit-learn
|
|
| 11 |
nltk
|
| 12 |
bm25s[full]
|
| 13 |
jax[cpu]
|
| 14 |
-
datasets==3.6.0
|
|
|
|
|
|
| 11 |
nltk
|
| 12 |
bm25s[full]
|
| 13 |
jax[cpu]
|
| 14 |
+
datasets==3.6.0
|
| 15 |
+
huggingface_hub==0.34.6
|