heymenn committed on
Commit
d9ebd80
·
1 Parent(s): 3b1bcb1

fix SET 26 CRs not found

Browse files
Files changed (2) hide show
  1. classes.py +15 -8
  2. requirements.txt +2 -1
classes.py CHANGED
@@ -48,21 +48,28 @@ class ETSIDocFinder:
48
 
49
  def search_document(self, doc_id: str):
50
  original = doc_id
51
-
52
  main_tsg, workgroup, doc = self.get_workgroup(doc_id)
53
  urls = []
54
  if main_tsg:
55
  wg_url = self.find_workgroup_url(main_tsg, workgroup)
56
  print(wg_url)
57
  if wg_url:
58
- files = self.get_docs_from_url(wg_url)
59
- print(files)
60
- for f in files:
61
- if doc in f.lower() or original in f:
62
- print(f)
63
- doc_url = f"{wg_url}/{f}"
64
  urls.append(doc_url)
65
- return urls[0] if len(urls) == 1 else urls[-2] if len(urls) > 1 else f"Document {doc_id} not found"
 
 
 
 
 
 
 
 
66
 
67
  class ETSISpecFinder:
68
  def __init__(self):
 
48
 
49
  def search_document(self, doc_id: str):
50
  original = doc_id
51
+
52
  main_tsg, workgroup, doc = self.get_workgroup(doc_id)
53
  urls = []
54
  if main_tsg:
55
  wg_url = self.find_workgroup_url(main_tsg, workgroup)
56
  print(wg_url)
57
  if wg_url:
58
+ entries = self.get_docs_from_url(wg_url)
59
+ print(entries)
60
+ for entry in entries:
61
+ if doc in entry.lower() or original in entry:
62
+ doc_url = f"{wg_url}/{entry}"
 
63
  urls.append(doc_url)
64
+ elif "." not in entry.rstrip("/"):
65
+ # looks like a subdirectory — go one level deeper
66
+ sub_url = f"{wg_url}/{entry}"
67
+ files = self.get_docs_from_url(sub_url)
68
+ for f in files:
69
+ if doc in f.lower() or original in f:
70
+ print(f)
71
+ urls.append(f"{sub_url}/{f}")
72
+ return urls[0] if len(urls) == 1 else urls[-1] if len(urls) > 1 else f"Document {doc_id} not found"
73
 
74
  class ETSISpecFinder:
75
  def __init__(self):
requirements.txt CHANGED
@@ -11,4 +11,5 @@ scikit-learn
11
  nltk
12
  bm25s[full]
13
  jax[cpu]
14
- datasets==3.6.0
 
 
11
  nltk
12
  bm25s[full]
13
  jax[cpu]
14
+ datasets==3.6.0
15
+ huggingface_hub==0.34.6