Marthee committed on
Commit
bdcaad1
·
verified ·
1 Parent(s): 121d16c

Update tsadropboxretrieval.py

Browse files
Files changed (1) hide show
  1. tsadropboxretrieval.py +14 -7
tsadropboxretrieval.py CHANGED
@@ -55,7 +55,7 @@ def getSharedLink(path):
55
  shared_link_metadata=dbxTeam.sharing_create_shared_link(path)
56
  return shared_link_metadata.url
57
 
58
- def handle_entries(entries):
59
 
60
  for file in entries:
61
  if isinstance(file, dropbox.files.FileMetadata):
@@ -66,6 +66,7 @@ def handle_entries(entries):
66
  'client_modified': file.client_modified,
67
  'server_modified': file.server_modified
68
  }
 
69
  files_list.append(metadata)
70
  df = pd.DataFrame.from_records(files_list)
71
  return df
@@ -115,18 +116,22 @@ def uploadanyFile(doc,pdfname,path):
115
 
116
  return 'Error uploading file to Dropbox.'
117
 
 
118
  # Call when the dropbox is updated with new items - if not , call parquet saved version of the df of saved items
119
  def DropboxItemstoDF():
 
120
  dbxTeam=ADR_Access_DropboxTeam('user') # or pass dbx in parameters
121
  folder_path = "/TSA Team Folder"
122
- res = dbxTeam.files_list_folder(path=folder_path, recursive=True)
123
- # df1=handle_entries(res.entries)
124
- while res.has_more:
125
- res = dbxTeam.files_list_folder_continue(cursor=res.cursor)
126
- df2=handle_entries(res.entries)
 
127
 
128
  # dbxTeam=dropbox_upload_file(df2)
129
- return df2
 
130
 
131
  # df2=DropboxItemstoDF()
132
 
@@ -169,7 +174,9 @@ def getPDFData(path):
169
  return data
170
 
171
  def retrieveProjects(projname):
 
172
  parquetDf=GetParquetDF()
 
173
  documentsToMeasure=[]
174
  RelevantDocuments=[]
175
  projnameWithDetails=''
 
55
  shared_link_metadata=dbxTeam.sharing_create_shared_link(path)
56
  return shared_link_metadata.url
57
 
58
+ def handle_entries(entries , files_list):
59
 
60
  for file in entries:
61
  if isinstance(file, dropbox.files.FileMetadata):
 
66
  'client_modified': file.client_modified,
67
  'server_modified': file.server_modified
68
  }
69
+
70
  files_list.append(metadata)
71
  df = pd.DataFrame.from_records(files_list)
72
  return df
 
116
 
117
  return 'Error uploading file to Dropbox.'
118
 
119
+ # Call when the dropbox is updated with new items - if not , call parquet saved version of the df of saved items
120
  # Call when the dropbox is updated with new items - if not , call parquet saved version of the df of saved items
121
  def DropboxItemstoDF():
122
+ files_list=[]
123
  dbxTeam=ADR_Access_DropboxTeam('user') # or pass dbx in parameters
124
  folder_path = "/TSA Team Folder"
125
+ res = dbxTeam.files_list_folder(path=folder_path, recursive=True )
126
+ # df1=handle_entries(res.entries , files_list)
127
+ if res.has_more:
128
+ while res.has_more:
129
+ res = dbxTeam.files_list_folder_continue(cursor=res.cursor)
130
+ df2=handle_entries(res.entries , files_list)
131
 
132
  # dbxTeam=dropbox_upload_file(df2)
133
+ print(df2)
134
+ return df2 , files_list
135
 
136
  # df2=DropboxItemstoDF()
137
 
 
174
  return data
175
 
176
  def retrieveProjects(projname):
177
+ print('retrieve')
178
  parquetDf=GetParquetDF()
179
+ print('p',parquetDf)
180
  documentsToMeasure=[]
181
  RelevantDocuments=[]
182
  projnameWithDetails=''