Spaces:

ss567uhg
/

nlpWeb

Sleeping

Sophia Koehler committed on Nov 11, 2024

Commit

a8a9cd5

1 Parent(s): 2fa43bc

fix3

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,9 +1,10 @@
 # -*- coding: utf-8 -*-
-from dataclasses import dataclass
 import pickle
 import os
-from typing import Iterable, Callable, List, Dict, Optional, Type, TypeVar
 from nlp4web_codebase.ir.data_loaders.dm import Document
 from collections import Counter
 import tqdm
@@ -11,6 +12,10 @@ import re
 import nltk
 nltk.download("stopwords", quiet=True)
 from nltk.corpus import stopwords as nltk_stopwords
 LANGUAGE = "english"
 word_splitter = re.compile(r"(?u)\b\w\w+\b").findall
@@ -133,21 +138,8 @@ def run_counting(
         doc_texts=doc_texts,
     )
-from nlp4web_codebase.ir.data_loaders.sciq import load_sciq
-sciq = load_sciq()
-counting = run_counting(documents=iter(sciq.corpus), ndocs=len(sciq.corpus))
 """### BM25 Index"""
-from __future__ import annotations
-from dataclasses import asdict, dataclass
-import math
-import os
-from typing import Iterable, List, Optional, Type
-import tqdm
-from nlp4web_codebase.ir.data_loaders.dm import Document
 @dataclass
 class BM25Index(InvertedIndex):
@@ -237,11 +229,6 @@ class BM25Index(InvertedIndex):
 """### BM25 Retriever"""
-from nlp4web_codebase.ir.models import BaseRetriever
-from typing import Type
-from abc import abstractmethod
 class BaseInvertedIndexRetriever(BaseRetriever):
     @property
@@ -301,9 +288,6 @@ class BM25Retriever(BaseInvertedIndexRetriever):
         return BM25Index
-import gradio as gr
-from typing import TypedDict
 class Hit(TypedDict):
   cid: str
   score: float

 # -*- coding: utf-8 -*-
+from dataclasses import asdict, dataclass
 import pickle
 import os
+from __future__ import annotations
+from typing import Iterable, Callable, List, Dict, Optional, Type, TypeVar, TypedDict
 from nlp4web_codebase.ir.data_loaders.dm import Document
 from collections import Counter
 import tqdm
 import nltk
 nltk.download("stopwords", quiet=True)
 from nltk.corpus import stopwords as nltk_stopwords
+import math
+from nlp4web_codebase.ir.models import BaseRetriever
+from abc import abstractmethod
+import gradio as gr
 LANGUAGE = "english"
 word_splitter = re.compile(r"(?u)\b\w\w+\b").findall
         doc_texts=doc_texts,
     )
 """### BM25 Index"""
 @dataclass
 class BM25Index(InvertedIndex):
 """### BM25 Retriever"""
 class BaseInvertedIndexRetriever(BaseRetriever):
     @property
         return BM25Index
 class Hit(TypedDict):
   cid: str
   score: float