Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
|
@@ -314,71 +314,74 @@ def find_rss():
|
|
| 314 |
cont = json.loads(j.read())
|
| 315 |
#print(cont)
|
| 316 |
for ea in cont:
|
| 317 |
-
#lod=""
|
| 318 |
-
#print (ea['link'])
|
| 319 |
-
if ea.get('link') is not None:
|
| 320 |
-
|
| 321 |
-
rss_url=ea['link']
|
| 322 |
-
else:
|
| 323 |
-
rss_url=ea['URL']
|
| 324 |
-
link_box=[]
|
| 325 |
-
r = requests.get(f'{rss_url}')
|
| 326 |
-
if r.status_code == 200:
|
| 327 |
-
try:
|
| 328 |
-
if ".json" in rss_url:
|
| 329 |
-
lod = json.loads(r.text)
|
| 330 |
-
if ".xml" in rss_url:
|
| 331 |
-
lod = xmltodict.parse(r.content)
|
| 332 |
-
if ".rss" in rss_url:
|
| 333 |
-
lod = xmltodict.parse(r.content)
|
| 334 |
-
else:
|
| 335 |
-
try:
|
| 336 |
-
lod = xmltodict.parse(r.content)
|
| 337 |
-
except Exception as e:
|
| 338 |
-
lod=f'{rss_url} ::ERROR:: {e}'
|
| 339 |
-
error_box.append({"Name":rss_url,"Error":e,"Error Code":1})
|
| 340 |
-
|
| 341 |
-
except Exception as e:
|
| 342 |
-
lod=f'{rss_url} ::ERROR:: {e}'
|
| 343 |
-
error_box.append({"Name":rss_url,"Error":e,"Error Code":2})
|
| 344 |
-
|
| 345 |
-
else:
|
| 346 |
-
lod = f'{rss_url} ::ERROR::COULD NOT CONNECT:: {r.status_code}'
|
| 347 |
-
error_box.append({"Name":rss_url,"Error":f'Status Code:{r.status_code}',"Error Code":3})
|
| 348 |
-
pass
|
| 349 |
try:
|
| 350 |
-
|
| 351 |
-
print(
|
| 352 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 353 |
try:
|
| 354 |
-
|
| 355 |
-
|
| 356 |
-
|
| 357 |
-
|
| 358 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 359 |
try:
|
| 360 |
r_link = ea['link']
|
| 361 |
-
r_title = ea['
|
| 362 |
-
r_description = '
|
| 363 |
lods = {"title":r_title, "description":r_description,"link":r_link}
|
| 364 |
-
except Exception
|
| 365 |
-
|
| 366 |
-
|
| 367 |
-
|
| 368 |
-
|
| 369 |
-
|
| 370 |
-
|
| 371 |
-
|
| 372 |
-
|
| 373 |
-
|
| 374 |
-
|
| 375 |
-
|
| 376 |
-
|
| 377 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 378 |
except Exception as e:
|
| 379 |
-
error_box.append({"Name":rss_url,"Error":e,"Error Code":
|
| 380 |
print(f'Exception::{e}')
|
| 381 |
-
print(f'Exception::{ea.keys()}')
|
| 382 |
|
| 383 |
#user_repo=save_data.split('datasets/',1)[1].split('/raw',1)[0]
|
| 384 |
timestamp=str(datetime.datetime.now())
|
|
|
|
| 314 |
cont = json.loads(j.read())
|
| 315 |
#print(cont)
|
| 316 |
for ea in cont:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 317 |
try:
|
| 318 |
+
#lod=""
|
| 319 |
+
#print (ea['link'])
|
| 320 |
+
if ea.get('link') is not None:
|
| 321 |
+
|
| 322 |
+
rss_url=ea['link']
|
| 323 |
+
else:
|
| 324 |
+
rss_url=ea['URL']
|
| 325 |
+
link_box=[]
|
| 326 |
+
r = requests.get(f'{rss_url}')
|
| 327 |
+
if r.status_code == 200:
|
| 328 |
try:
|
| 329 |
+
if ".json" in rss_url:
|
| 330 |
+
lod = json.loads(r.text)
|
| 331 |
+
if ".xml" in rss_url:
|
| 332 |
+
lod = xmltodict.parse(r.content)
|
| 333 |
+
if ".rss" in rss_url:
|
| 334 |
+
lod = xmltodict.parse(r.content)
|
| 335 |
+
else:
|
| 336 |
+
try:
|
| 337 |
+
lod = xmltodict.parse(r.content)
|
| 338 |
+
except Exception as e:
|
| 339 |
+
lod=f'{rss_url} ::ERROR:: {e}'
|
| 340 |
+
error_box.append({"Name":rss_url,"Error":e,"Error Code":1})
|
| 341 |
+
|
| 342 |
+
except Exception as e:
|
| 343 |
+
lod=f'{rss_url} ::ERROR:: {e}'
|
| 344 |
+
error_box.append({"Name":rss_url,"Error":e,"Error Code":2})
|
| 345 |
+
|
| 346 |
+
else:
|
| 347 |
+
lod = f'{rss_url} ::ERROR::COULD NOT CONNECT:: {r.status_code}'
|
| 348 |
+
error_box.append({"Name":rss_url,"Error":f'Status Code:{r.status_code}',"Error Code":3})
|
| 349 |
+
pass
|
| 350 |
+
try:
|
| 351 |
+
print(lod['rss']['channel']['item'][0].keys())
|
| 352 |
+
print(lod['rss'].keys())
|
| 353 |
+
for i,ea in enumerate(lod['rss']['channel']['item']):
|
| 354 |
try:
|
| 355 |
r_link = ea['link']
|
| 356 |
+
r_title = ea['title']
|
| 357 |
+
r_description = ea['description']
|
| 358 |
lods = {"title":r_title, "description":r_description,"link":r_link}
|
| 359 |
+
except Exception:
|
| 360 |
+
try:
|
| 361 |
+
r_link = ea['link']
|
| 362 |
+
r_title = ea['source']
|
| 363 |
+
r_description = 'No Description provided'
|
| 364 |
+
lods = {"title":r_title, "description":r_description,"link":r_link}
|
| 365 |
+
except Exception as e:
|
| 366 |
+
error_box.append({"Name":rss_url,"Error":e,"Error Code":4})
|
| 367 |
+
print(e)
|
| 368 |
+
pass
|
| 369 |
+
#lods = {"title":"ERROR", "description":{e},"link":"ERROR"}
|
| 370 |
+
|
| 371 |
+
"""
|
| 372 |
+
r_link = lod['rss']['channel']['item'][i]['link']
|
| 373 |
+
r_title = lod['rss']['channel']['item'][i]['title']
|
| 374 |
+
r_description = lod['rss']['channel']['item'][i]['description']"""
|
| 375 |
+
link_box.append(lods)
|
| 376 |
+
lod={lod['rss']['channel']['title']:link_box}
|
| 377 |
+
out_box.append(lod)
|
| 378 |
+
|
| 379 |
+
except Exception as e:
|
| 380 |
+
error_box.append({"Name":rss_url,"Error":e,"Error Code":5})
|
| 381 |
+
print(f'Exception::{e}')
|
| 382 |
except Exception as e:
|
| 383 |
+
error_box.append({"Name":rss_url,"Error":e,"Error Code":6})
|
| 384 |
print(f'Exception::{e}')
|
|
|
|
| 385 |
|
| 386 |
#user_repo=save_data.split('datasets/',1)[1].split('/raw',1)[0]
|
| 387 |
timestamp=str(datetime.datetime.now())
|