|
@@ -0,0 +1,85 @@
|
|
|
+
|
|
|
+import sqlite3
|
|
|
+import pandas as pd
|
|
|
+import dtale
|
|
|
+import unicodedata
|
|
|
+from simple_query_test_pandas import ricercaforme
|
|
|
+from simple_query_test_pandas import ricercalemmi
|
|
|
+from simple_query_test_pandas import ricercaformelemmi
|
|
|
+from simple_query_test_pandas import ricercalemmiforme
|
|
|
+from simple_query_test_pandas import inizialeraddoppiata
|
|
|
+from simple_query_test_pandas import interpreter
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
# Word to look up ("parola" is Italian for "word").
parola = "dare"

# Pass the word through interpreter() and hand the result to ricercaforme().
# NOTE(review): the meaning of the "../", 0, 0 arguments is defined in
# simple_query_test_pandas and is not visible from this file.
search = ricercaforme(
    interpreter(parola),
    "../",
    0,
    0,
)
print(search)

# Table names handed to findtexts() below; each one is used in a FROM clause.
listOcc = [
    "occ00001",
    "occ00002",
    "occ00003",
]
|
|
|
+
|
|
|
def findtexts(df, listOcc, path):
    """Look up the text locations of every code in ``df['cod']``.

    For each table named in ``listOcc`` and each value of the ``cod`` column
    of ``df``, the table is joined with ``intbib`` on ``ntx`` and the rows
    whose ``cod`` equals that value are collected.

    Args:
        df: DataFrame with a ``cod`` column holding the codes to look up.
        listOcc: iterable of table names. They are interpolated into the SQL
            text unchanged (identifiers cannot be bound as parameters), so
            they must come from a trusted source.
        path: directory containing ``db/test1.db``; the database is opened
            read-only.

    Returns:
        A DataFrame with the columns ``ntx``, ``pitxt``, ``elemlen`` and
        ``sigla``, one row per match, with a fresh 0..n-1 index. An empty
        DataFrame is returned when there is nothing to query.
    """
    # Iterate the *values* of the column. Iterating ``df[['cod']]`` yields
    # the column label "cod", which turned the filter into ``cod=cod``.
    # ``tolist()`` also converts NumPy scalars to native Python objects,
    # which is what sqlite3 can bind as parameters.
    codes = df['cod'].tolist()

    frames = []
    con = sqlite3.connect("file:" + path + "/db/test1.db" + "?mode=ro", uri=True)
    try:
        for table in listOcc:
            query = (
                "SELECT tab.ntx, tab.pitxt, tab.elemlen, intbib.sigla FROM "
                + table
                + " AS tab INNER JOIN intbib ON tab.ntx = intbib.ntx WHERE cod=?"
            )
            for code in codes:
                # Bind the code instead of concatenating it into the SQL.
                frames.append(pd.read_sql(query, con, params=(code,)))
    finally:
        # Always release the connection, even when a query fails.
        con.close()

    if not frames:
        return pd.DataFrame()
    # Concatenate once (not inside the loop) and renumber the rows so that
    # index labels are unique across the per-query results.
    return pd.concat(frames, ignore_index=True)
|
|
|
+
|
|
|
# Resolve the search results into text locations using the database under "../".
textlist = findtexts(df=search, listOcc=listOcc, path="../")
print(textlist)
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
def findcontexts(textlist, charOffsetConst, itxtDir="../db/itxt/"):
    """Read the text surrounding every hit listed in ``textlist``.

    Args:
        textlist: DataFrame with the columns ``ntx``, ``pitxt``, ``elemlen``
            and ``sigla``. ``sigla`` names a file inside ``itxtDir``;
            ``pitxt`` and ``elemlen`` are used as the character offset and
            length of the hit inside that file.
        charOffsetConst: number of characters of context to include before
            and after the hit.
        itxtDir: directory holding the text files, which are read as
            UTF-32-LE. Defaults to the location that was previously
            hard-coded.

    Returns:
        A list of strings, one per row of ``textlist``, in row order.
    """
    import os

    print(textlist)
    contexts = []
    for _, row in textlist.iterrows():
        print(row["ntx"], row['sigla'])
        pitxtLocal = int(row["pitxt"])
        # Take the length from the row itself: ``textlist['elemlen'][ind]``
        # returns a whole Series when index labels repeat, which is the case
        # for frames assembled with pd.concat.
        elemLen = int(row["elemlen"])
        sigla = row["sigla"]
        print('Indice: ' + str(pitxtLocal))
        print('Sigla: ' + sigla)

        # Clamp the window at the start of the file and shorten the read
        # accordingly, so a hit near the beginning does not receive extra
        # trailing context in place of the missing leading context.
        start = max(pitxtLocal - charOffsetConst, 0)
        end = pitxtLocal + elemLen + charOffsetConst

        with open(os.path.join(itxtDir, sigla), 'r', encoding="utf-32-le") as file1:
            # UTF-32 stores every character in exactly 4 bytes, so the byte
            # position of character ``start`` is ``4 * start``.
            file1.seek(4 * start, 0)
            contexts.append(file1.read(end - start))
    return contexts
|
|
|
+
|
|
|
# Number of context characters requested on each side of a hit.
charOffsetConst = 100
contexts = findcontexts(textlist, charOffsetConst)
print(contexts)

# Print the contexts again, one per paragraph, numbered from 1.
print()
for number, snippet in enumerate(contexts, start=1):
    print(str(number) + ":")
    print(snippet)
    print()
|
|
|
+
|
|
|
+
|
|
|
# The former closeConn(cur1) call was dropped: neither closeConn nor cur1 is
# defined or imported in this file, so it raised NameError. findtexts() opens
# its own connection, so there is no module-level handle to close here.

# Cross-check: print 20 characters either side of the first two hits, sliced
# from the fully decoded text.
# NOTE(review): the original indexed an undefined `res2` and always read
# "p07"; this assumes `res2[k][1]` meant the pitxt of hit k and that each hit
# should be checked against its own sigla file - confirm.
previews = []
for _, hit in textlist.head(2).iterrows():
    with open("../db/itxt/" + hit["sigla"], 'r', encoding="utf-32-le") as file:
        pyppa = file.read()
    centre = int(hit["pitxt"])
    # Clamp at 0: a negative slice start would count from the end of the text.
    previews.append(pyppa[max(centre - 20, 0):centre + 20])

if previews:
    # Same layout as before: the previews separated by one blank line.
    print("\n\n".join(previews))
|
|
|
+
|