Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -69,12 +69,12 @@ def download_youtube_video(video_url, output_dir, title=None):
|
|
69 |
def fetch_and_download_youtube_video(query, output_dir="./downloads"):
|
70 |
"""Fetch and download the best YouTube video for a query."""
|
71 |
ydl_opts = {
|
72 |
-
|
73 |
-
|
74 |
-
|
75 |
-
|
76 |
-
|
77 |
-
|
78 |
try:
|
79 |
with YoutubeDL(ydl_opts) as ydl:
|
80 |
search_results = ydl.extract_info(query, download=False)
|
@@ -87,28 +87,37 @@ def fetch_and_download_youtube_video(query, output_dir="./downloads"):
|
|
87 |
print(f"Error fetching YouTube video for query '{query}': {e}")
|
88 |
return []
|
89 |
|
|
|
|
|
90 |
def fetch_from_arxiv(query="machine learning", max_results=2, output_dir="./papers"):
|
91 |
"""Fetch papers from arXiv and download their PDFs."""
|
92 |
-
|
|
|
|
|
93 |
query=query,
|
94 |
max_results=max_results,
|
95 |
-
sort_by=
|
96 |
)
|
97 |
metadata = []
|
98 |
-
for i, result in enumerate(
|
99 |
-
pdf_url = result.pdf_url
|
100 |
filename = f"{query.replace(' ', '_')}_arxiv_{i}.pdf"
|
101 |
local_path = os.path.join(output_dir, filename)
|
102 |
try:
|
|
|
103 |
response = requests.get(pdf_url)
|
104 |
if response.status_code == 200:
|
105 |
with open(local_path, 'wb') as f:
|
106 |
f.write(response.content)
|
|
|
107 |
metadata.append({"title": result.title, "url": pdf_url, "file_path": local_path, "type": "paper"})
|
|
|
|
|
108 |
except Exception as e:
|
109 |
print(f"Error downloading paper: {e}")
|
110 |
return metadata
|
111 |
|
|
|
112 |
def generate_llama_response(query, context=None):
|
113 |
"""Generate a response using LLaMA 2."""
|
114 |
input_text = f"Query: {query}\n"
|
|
|
69 |
def fetch_and_download_youtube_video(query, output_dir="./downloads"):
|
70 |
"""Fetch and download the best YouTube video for a query."""
|
71 |
ydl_opts = {
|
72 |
+
'quiet': True,
|
73 |
+
'outtmpl': f"{output_dir}/{sanitized_title}.%(ext)s",
|
74 |
+
'format': 'best',
|
75 |
+
'cookiesfrombrowser': ('chrome',), # Adjust for your browser (e.g., 'firefox', 'edge')
|
76 |
+
}
|
77 |
+
|
78 |
try:
|
79 |
with YoutubeDL(ydl_opts) as ydl:
|
80 |
search_results = ydl.extract_info(query, download=False)
|
|
|
87 |
print(f"Error fetching YouTube video for query '{query}': {e}")
|
88 |
return []
|
89 |
|
90 |
+
from arxiv import Client, Search, SortCriterion
|
91 |
+
|
92 |
def fetch_from_arxiv(query="machine learning", max_results=2, output_dir="./papers"):
    """Fetch papers from arXiv and download their PDFs.

    Args:
        query: Search string passed to the arXiv API.
        max_results: Maximum number of papers to fetch.
        output_dir: Directory the PDFs are written to (created if missing).

    Returns:
        A list of dicts, one per successfully downloaded paper, with keys
        "title", "url", "file_path", and "type" (always "paper").
    """
    print(f"Fetching papers for query: {query}")
    # Create the target directory up front so open() below cannot fail
    # with FileNotFoundError on a fresh checkout.
    os.makedirs(output_dir, exist_ok=True)
    client = Client()
    search = Search(
        query=query,
        max_results=max_results,
        sort_by=SortCriterion.Relevance,
    )
    metadata = []
    for i, result in enumerate(client.results(search)):
        pdf_url = result.pdf_url  # Direct link to the paper's PDF
        filename = f"{query.replace(' ', '_')}_arxiv_{i}.pdf"
        local_path = os.path.join(output_dir, filename)
        try:
            # Bound the request so a stalled server cannot hang the whole fetch.
            response = requests.get(pdf_url, timeout=30)
            if response.status_code == 200:
                with open(local_path, 'wb') as f:
                    f.write(response.content)
                # Original message was garbled in the diff ("(unknown)");
                # report the path the PDF was saved to.
                print(f"Downloaded paper: {local_path}")
                metadata.append({"title": result.title, "url": pdf_url, "file_path": local_path, "type": "paper"})
            else:
                print(f"Failed to download paper: {pdf_url}. Status code: {response.status_code}")
        except Exception as e:
            # Best-effort: log and skip this paper, keep fetching the rest.
            print(f"Error downloading paper: {e}")
    return metadata
|
119 |
|
120 |
+
|
121 |
def generate_llama_response(query, context=None):
|
122 |
"""Generate a response using LLaMA 2."""
|
123 |
input_text = f"Query: {query}\n"
|