|
@@ -37,82 +37,75 @@ class basicQueries:
|
|
|
|
|
|
|
|
|
|
|
|
def findtexts(self, type, df, index=None):
    """Query every occurrence table for the texts matching the codes in *df*.

    Args:
        type: Value forwarded as ``'querySubtype'`` of the ``'texts'``
            query.  When it equals ``2`` an extra ``'pfl'`` query is run
            first and its ``codForma`` column is attached to the request
            as ``'formCodList'``.  (The name shadows the builtin but is
            kept because it is part of the public signature.)
        df: A ``pandas.DataFrame`` with a ``cod`` column, or anything
            ``pd.DataFrame(...)`` accepts that yields such a column.
        index: Optional row selection applied with ``df.loc``: a single
            label, a list of labels or a ``range``.  ``None`` keeps all
            rows.

    Returns:
        The per-table query results concatenated with ``pd.concat`` in
        the order of ``self.listOcc``; an empty ``DataFrame`` when
        ``self.listOcc`` is empty.
    """
    if not isinstance(df, pd.DataFrame):
        df = pd.DataFrame(df)

    if index is not None:
        # Always hand ``.loc`` a list so the selection stays a DataFrame,
        # even for a single label.
        if isinstance(index, range):
            index = list(index)
        elif not isinstance(index, list):
            index = [index]
        df = df.loc[index]

    # Read the column directly: iterating rows with ``iterrows`` builds a
    # Series per row and does not preserve dtypes across the row.
    codList = df['cod'].tolist()

    queryData = {'queryType': 'texts', 'querySubtype': type, 'codList': codList}

    if type == 2:
        # The form-code lookup does not depend on the table, so it is
        # resolved once before fanning out over the occurrence tables.
        subQueryData = {'queryType': 'pfl', 'codList': codList}
        subdf = self.queryHandler.query(subQueryData, pandas=True)
        queryData['formCodList'] = list(subdf['codForma'])

    queryResponses = [
        self.queryHandler.query(dict(queryData, table=table), pandas=True)
        for table in self.listOcc
    ]

    # ``pd.concat`` raises ValueError on an empty sequence; with no
    # occurrence tables there is simply nothing to return.
    if not queryResponses:
        return pd.DataFrame()
    return pd.concat(queryResponses)
|
|
|
|
|
|
|
|
|
|
|
|
def findcontexts(self, textlist, parole=31):
    """Attach the surrounding context of every row of *textlist*.

    For each row, every table in ``self.listOcc`` is asked for a
    ``'contexts'`` query built from the row's ``ntx`` and ``mappa``
    values.  The smallest and largest ``pitxt`` across all answers
    delimit the span passed to ``self.queryHandler.textQuery`` together
    with the row's ``sigla``.

    Args:
        textlist: ``pandas.DataFrame`` with ``sigla``, ``ntx`` and
            ``mappa`` columns.  NOTE: the four result columns are added
            to this object in place, as the method has always done.
        parole: Value sent as the ``'parole'`` field of each contexts
            query (presumably the context width in words -- confirm
            against the query handler).  Defaults to 31, the value that
            used to be hard-coded.

    Returns:
        *textlist* with the extra columns ``piniz`` (min ``pitxt``),
        ``pifin`` (max ``pitxt``), ``contesto`` (first value returned by
        ``textQuery``) and ``format contesto`` (second value, JSON
        encoded), re-indexed from 0.
    """
    listOcc = self.listOcc

    contexts = []
    formats = []
    minChar_list = []
    maxChar_list = []

    # Walk only the three columns that are needed; unlike ``iterrows``
    # this neither builds a Series per row nor coerces the row to a
    # common dtype.
    rows = zip(textlist["sigla"], textlist["ntx"], textlist["mappa"])
    for sigla, ntxlocal, mappalocal in rows:
        pointerlist = pd.concat([
            self.queryHandler.query(
                {
                    'table': table,
                    'queryType': 'contexts',
                    'ntxlocal': ntxlocal,
                    'mappalocal': mappalocal,
                    'parole': parole,
                },
                pandas=True,
            )
            for table in listOcc
        ])

        minChar = pointerlist["pitxt"].min()
        maxChar = pointerlist["pitxt"].max()

        fileQueryData = {'sigla': sigla, 'minChar': minChar, 'maxChar': maxChar}
        cont, form = self.queryHandler.textQuery(fileQueryData, True)

        minChar_list.append(minChar)
        maxChar_list.append(maxChar)
        contexts.append(cont)
        formats.append(json.dumps(form))

    textlist['piniz'] = minChar_list
    textlist['pifin'] = maxChar_list
    textlist['contesto'] = contexts
    textlist['format contesto'] = formats
    return textlist.reset_index(drop=True)
|
|
|
|
|
|
|
|
|
def findbib(self, contexts):
|