Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
@@ -314,71 +314,74 @@ def find_rss():
|
|
314 |
cont = json.loads(j.read())
|
315 |
#print(cont)
|
316 |
for ea in cont:
|
317 |
-
#lod=""
|
318 |
-
#print (ea['link'])
|
319 |
-
if ea.get('link') is not None:
|
320 |
-
|
321 |
-
rss_url=ea['link']
|
322 |
-
else:
|
323 |
-
rss_url=ea['URL']
|
324 |
-
link_box=[]
|
325 |
-
r = requests.get(f'{rss_url}')
|
326 |
-
if r.status_code == 200:
|
327 |
-
try:
|
328 |
-
if ".json" in rss_url:
|
329 |
-
lod = json.loads(r.text)
|
330 |
-
if ".xml" in rss_url:
|
331 |
-
lod = xmltodict.parse(r.content)
|
332 |
-
if ".rss" in rss_url:
|
333 |
-
lod = xmltodict.parse(r.content)
|
334 |
-
else:
|
335 |
-
try:
|
336 |
-
lod = xmltodict.parse(r.content)
|
337 |
-
except Exception as e:
|
338 |
-
lod=f'{rss_url} ::ERROR:: {e}'
|
339 |
-
error_box.append({"Name":rss_url,"Error":e,"Error Code":1})
|
340 |
-
|
341 |
-
except Exception as e:
|
342 |
-
lod=f'{rss_url} ::ERROR:: {e}'
|
343 |
-
error_box.append({"Name":rss_url,"Error":e,"Error Code":2})
|
344 |
-
|
345 |
-
else:
|
346 |
-
lod = f'{rss_url} ::ERROR::COULD NOT CONNECT:: {r.status_code}'
|
347 |
-
error_box.append({"Name":rss_url,"Error":f'Status Code:{r.status_code}',"Error Code":3})
|
348 |
-
pass
|
349 |
try:
|
350 |
-
|
351 |
-
print(
|
352 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
353 |
try:
|
354 |
-
|
355 |
-
|
356 |
-
|
357 |
-
|
358 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
359 |
try:
|
360 |
r_link = ea['link']
|
361 |
-
r_title = ea['
|
362 |
-
r_description = '
|
363 |
lods = {"title":r_title, "description":r_description,"link":r_link}
|
364 |
-
except Exception
|
365 |
-
|
366 |
-
|
367 |
-
|
368 |
-
|
369 |
-
|
370 |
-
|
371 |
-
|
372 |
-
|
373 |
-
|
374 |
-
|
375 |
-
|
376 |
-
|
377 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
378 |
except Exception as e:
|
379 |
-
error_box.append({"Name":rss_url,"Error":e,"Error Code":
|
380 |
print(f'Exception::{e}')
|
381 |
-
print(f'Exception::{ea.keys()}')
|
382 |
|
383 |
#user_repo=save_data.split('datasets/',1)[1].split('/raw',1)[0]
|
384 |
timestamp=str(datetime.datetime.now())
|
|
|
314 |
cont = json.loads(j.read())
|
315 |
#print(cont)
|
316 |
for ea in cont:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
317 |
try:
|
318 |
+
#lod=""
|
319 |
+
#print (ea['link'])
|
320 |
+
if ea.get('link') is not None:
|
321 |
+
|
322 |
+
rss_url=ea['link']
|
323 |
+
else:
|
324 |
+
rss_url=ea['URL']
|
325 |
+
link_box=[]
|
326 |
+
r = requests.get(f'{rss_url}')
|
327 |
+
if r.status_code == 200:
|
328 |
try:
|
329 |
+
if ".json" in rss_url:
|
330 |
+
lod = json.loads(r.text)
|
331 |
+
if ".xml" in rss_url:
|
332 |
+
lod = xmltodict.parse(r.content)
|
333 |
+
if ".rss" in rss_url:
|
334 |
+
lod = xmltodict.parse(r.content)
|
335 |
+
else:
|
336 |
+
try:
|
337 |
+
lod = xmltodict.parse(r.content)
|
338 |
+
except Exception as e:
|
339 |
+
lod=f'{rss_url} ::ERROR:: {e}'
|
340 |
+
error_box.append({"Name":rss_url,"Error":e,"Error Code":1})
|
341 |
+
|
342 |
+
except Exception as e:
|
343 |
+
lod=f'{rss_url} ::ERROR:: {e}'
|
344 |
+
error_box.append({"Name":rss_url,"Error":e,"Error Code":2})
|
345 |
+
|
346 |
+
else:
|
347 |
+
lod = f'{rss_url} ::ERROR::COULD NOT CONNECT:: {r.status_code}'
|
348 |
+
error_box.append({"Name":rss_url,"Error":f'Status Code:{r.status_code}',"Error Code":3})
|
349 |
+
pass
|
350 |
+
try:
|
351 |
+
print(lod['rss']['channel']['item'][0].keys())
|
352 |
+
print(lod['rss'].keys())
|
353 |
+
for i,ea in enumerate(lod['rss']['channel']['item']):
|
354 |
try:
|
355 |
r_link = ea['link']
|
356 |
+
r_title = ea['title']
|
357 |
+
r_description = ea['description']
|
358 |
lods = {"title":r_title, "description":r_description,"link":r_link}
|
359 |
+
except Exception:
|
360 |
+
try:
|
361 |
+
r_link = ea['link']
|
362 |
+
r_title = ea['source']
|
363 |
+
r_description = 'No Description provided'
|
364 |
+
lods = {"title":r_title, "description":r_description,"link":r_link}
|
365 |
+
except Exception as e:
|
366 |
+
error_box.append({"Name":rss_url,"Error":e,"Error Code":4})
|
367 |
+
print(e)
|
368 |
+
pass
|
369 |
+
#lods = {"title":"ERROR", "description":{e},"link":"ERROR"}
|
370 |
+
|
371 |
+
"""
|
372 |
+
r_link = lod['rss']['channel']['item'][i]['link']
|
373 |
+
r_title = lod['rss']['channel']['item'][i]['title']
|
374 |
+
r_description = lod['rss']['channel']['item'][i]['description']"""
|
375 |
+
link_box.append(lods)
|
376 |
+
lod={lod['rss']['channel']['title']:link_box}
|
377 |
+
out_box.append(lod)
|
378 |
+
|
379 |
+
except Exception as e:
|
380 |
+
error_box.append({"Name":rss_url,"Error":e,"Error Code":5})
|
381 |
+
print(f'Exception::{e}')
|
382 |
except Exception as e:
|
383 |
+
error_box.append({"Name":rss_url,"Error":e,"Error Code":6})
|
384 |
print(f'Exception::{e}')
|
|
|
385 |
|
386 |
#user_repo=save_data.split('datasets/',1)[1].split('/raw',1)[0]
|
387 |
timestamp=str(datetime.datetime.now())
|