Spaces:
Sleeping
Sleeping
Update tsadropboxretrieval.py
Browse files- tsadropboxretrieval.py +14 -7
tsadropboxretrieval.py
CHANGED
|
@@ -55,7 +55,7 @@ def getSharedLink(path):
|
|
| 55 |
shared_link_metadata=dbxTeam.sharing_create_shared_link(path)
|
| 56 |
return shared_link_metadata.url
|
| 57 |
|
| 58 |
-
def handle_entries(entries):
|
| 59 |
|
| 60 |
for file in entries:
|
| 61 |
if isinstance(file, dropbox.files.FileMetadata):
|
|
@@ -66,6 +66,7 @@ def handle_entries(entries):
|
|
| 66 |
'client_modified': file.client_modified,
|
| 67 |
'server_modified': file.server_modified
|
| 68 |
}
|
|
|
|
| 69 |
files_list.append(metadata)
|
| 70 |
df = pd.DataFrame.from_records(files_list)
|
| 71 |
return df
|
|
@@ -115,18 +116,22 @@ def uploadanyFile(doc,pdfname,path):
|
|
| 115 |
|
| 116 |
return 'Error uploading file to Dropbox.'
|
| 117 |
|
|
|
|
| 118 |
# Call this when Dropbox has been updated with new items; otherwise, load the parquet-saved version of the DataFrame of saved items.
|
| 119 |
def DropboxItemstoDF():
|
|
|
|
| 120 |
dbxTeam=ADR_Access_DropboxTeam('user') # or pass dbx in parameters
|
| 121 |
folder_path = "/TSA Team Folder"
|
| 122 |
-
res = dbxTeam.files_list_folder(path=folder_path, recursive=True)
|
| 123 |
-
# df1=handle_entries(res.entries)
|
| 124 |
-
|
| 125 |
-
|
| 126 |
-
|
|
|
|
| 127 |
|
| 128 |
# dbxTeam=dropbox_upload_file(df2)
|
| 129 |
-
|
|
|
|
| 130 |
|
| 131 |
# df2=DropboxItemstoDF()
|
| 132 |
|
|
@@ -169,7 +174,9 @@ def getPDFData(path):
|
|
| 169 |
return data
|
| 170 |
|
| 171 |
def retrieveProjects(projname):
|
|
|
|
| 172 |
parquetDf=GetParquetDF()
|
|
|
|
| 173 |
documentsToMeasure=[]
|
| 174 |
RelevantDocuments=[]
|
| 175 |
projnameWithDetails=''
|
|
|
|
| 55 |
shared_link_metadata=dbxTeam.sharing_create_shared_link(path)
|
| 56 |
return shared_link_metadata.url
|
| 57 |
|
| 58 |
+
def handle_entries(entries , files_list):
|
| 59 |
|
| 60 |
for file in entries:
|
| 61 |
if isinstance(file, dropbox.files.FileMetadata):
|
|
|
|
| 66 |
'client_modified': file.client_modified,
|
| 67 |
'server_modified': file.server_modified
|
| 68 |
}
|
| 69 |
+
|
| 70 |
files_list.append(metadata)
|
| 71 |
df = pd.DataFrame.from_records(files_list)
|
| 72 |
return df
|
|
|
|
| 116 |
|
| 117 |
return 'Error uploading file to Dropbox.'
|
| 118 |
|
| 119 |
+
# Call this when Dropbox has been updated with new items; otherwise, load the parquet-saved version of the DataFrame of saved items.
|
| 120 |
# Call this when Dropbox has been updated with new items; otherwise, load the parquet-saved version of the DataFrame of saved items.
|
| 121 |
def DropboxItemstoDF():
    """List every file under the team folder and return it as a DataFrame.

    Calls ``files_list_folder`` recursively on "/TSA Team Folder" and keeps
    following the returned cursor with ``files_list_folder_continue`` until
    ``has_more`` is false. Each page's entries are handed to
    ``handle_entries``, which appends to ``files_list`` and returns a
    DataFrame built from the accumulated list.

    Returns:
        A tuple ``(df2, files_list)``: the DataFrame returned by the last
        ``handle_entries`` call, and the list of per-file metadata records
        it was built from.
    """
    files_list = []
    dbxTeam = ADR_Access_DropboxTeam('user')  # or pass dbx in parameters
    folder_path = "/TSA Team Folder"

    res = dbxTeam.files_list_folder(path=folder_path, recursive=True)
    # The first response already carries a page of entries; process it so
    # those files are not dropped, and so df2 is always bound even when the
    # whole listing fits in a single page (has_more is False).
    df2 = handle_entries(res.entries, files_list)

    # Follow the cursor until the listing is exhausted.
    while res.has_more:
        res = dbxTeam.files_list_folder_continue(cursor=res.cursor)
        df2 = handle_entries(res.entries, files_list)

    # dbxTeam=dropbox_upload_file(df2)
    print(df2)
    return df2, files_list
|
| 135 |
|
| 136 |
# df2=DropboxItemstoDF()
|
| 137 |
|
|
|
|
| 174 |
return data
|
| 175 |
|
| 176 |
def retrieveProjects(projname):
|
| 177 |
+
print('retrieve')
|
| 178 |
parquetDf=GetParquetDF()
|
| 179 |
+
print('p',parquetDf)
|
| 180 |
documentsToMeasure=[]
|
| 181 |
RelevantDocuments=[]
|
| 182 |
projnameWithDetails=''
|