Spaces:

sharsh02
/

StockX-Mixtral8x7B

Running

App Files Files

sharsh02 committed on 26 days ago

Commit

e71e232

•

1 Parent(s): 2f3a946

Update app.py

Browse files

Files changed (1) hide show

app.py +6 -6

app.py CHANGED Viewed

@@ -61,7 +61,7 @@ async def latest_earning():
     url = "https://www.moneycontrol.com/markets/earnings/india-inc-earnings/?selected=all"
     # Send a GET request to fetch the raw HTML content
-    response = requests.get(url)
     # Parse the content using BeautifulSoup
     soup = BeautifulSoup(response.content, "html.parser")
@@ -83,7 +83,7 @@ async def todays_news():
     url = 'https://trendlyne.com/markets-today/'
     # logging.info("getting news from %s", url)
     # Fetch the HTML content of the webpage
-    html_content = requests.get(url).text
     soup = BeautifulSoup(html_content, 'html.parser')
     insights = soup.find_all(class_='insight-box')
@@ -210,7 +210,7 @@ def get_the_ticker(stock_name):
             url = f'https://www.google.com/search?q={query}&FORM=HDRSC7'
             # logging.info("searching ticker using url: %s",url)
             # Fetch the HTML content of the webpage
-            html_content = requests.get(url).text  # Fix: Added .text to access the response text
             soup = BeautifulSoup(html_content, "html.parser")
             pattern = re.compile(r'(\w+%[0-9A-Fa-f]{2}(?:[0-9A-Fa-f]{2}|[0-9A-Fa-f])*|[\w\.&%-]+)\.NS')  # This pattern matches any word followed by .NS
             matches = pattern.findall(str(soup))
@@ -230,7 +230,7 @@ async def get_the_ticker_stat(stock):
         url = f'https://www.google.com/search?q={urllib.parse.quote(stock)}+site:businesstoday.in/stocks/&num=1&sca_esv=28795b6719ac1a08&sxsrf=ACQVn08xDA1EP1V6hJ-q4jLjjXSWWxgHTw:1711450545062&source=lnt&tbs=li:1&sa=X&ved=2ahUKEwj426eO4pGFAxX4n2MGHRXqBTUQpwV6BAgBEBM&biw=1280&bih=567&dpr=1.5'
         # logging.info("getting ticker stat url from: %s", url)
         # Fetch the HTML content of the webpage
-        html_content = requests.get(url).text  # Fix: Added .text to access the response text
         pattern = r'href="/url[?]q=(https://www.businesstoday.in/stocks/[^"]+)"'
         # Find all matches using re.findall
         links = re.findall(pattern, html_content)
@@ -239,7 +239,7 @@ async def get_the_ticker_stat(stock):
         url = (links[0].split("&"))[0]
         # logging.info("Final URL to fetch stats %s" , url)
         # Fetch the HTML content of the webpage
-        html_content = requests.get(url).text
         soup = BeautifulSoup(html_content, "html.parser")
         script = soup.find("script", type="application/ld+json")
@@ -270,7 +270,7 @@ async def get_the_ticker_news(stock):
         url = f'https://www.google.com/search?q={urllib.parse.quote(stock)}+site:trendlyne.com/research-reports&num=3&sca_esv=28795b6719ac1a08&sxsrf=ACQVn08xDA1EP1V6hJ-q4jLjjXSWWxgHTw:1711450545062&source=lnt&tbs=li:1&sa=X&ved=2ahUKEwj426eO4pGFAxX4n2MGHRXqBTUQpwV6BAgBEBM&biw=1280&bih=567&dpr=1.5'
         # logging.info(url)
         # Fetch the HTML content of the webpage
-        html_content = requests.get(url).text  # Fix: Added .text to access the response text
         pattern = r'href="/url[?]q=(https://trendlyne.com/research-reports/[^"]+)"'
         # Find all matches using re.findall
         links = re.findall(pattern, html_content)

     url = "https://www.moneycontrol.com/markets/earnings/india-inc-earnings/?selected=all"
     # Send a GET request to fetch the raw HTML content
+    response = requests.get(url,headers={'User-Agent': 'Mozilla/5.0'})
     # Parse the content using BeautifulSoup
     soup = BeautifulSoup(response.content, "html.parser")
     url = 'https://trendlyne.com/markets-today/'
     # logging.info("getting news from %s", url)
     # Fetch the HTML content of the webpage
+    html_content = requests.get(url,headers={'User-Agent': 'Mozilla/5.0'}).text
     soup = BeautifulSoup(html_content, 'html.parser')
     insights = soup.find_all(class_='insight-box')
             url = f'https://www.google.com/search?q={query}&FORM=HDRSC7'
             # logging.info("searching ticker using url: %s",url)
             # Fetch the HTML content of the webpage
+            html_content = requests.get(url,headers={'User-Agent': 'Mozilla/5.0'}).text  # Fix: Added .text to access the response text
             soup = BeautifulSoup(html_content, "html.parser")
             pattern = re.compile(r'(\w+%[0-9A-Fa-f]{2}(?:[0-9A-Fa-f]{2}|[0-9A-Fa-f])*|[\w\.&%-]+)\.NS')  # This pattern matches any word followed by .NS
             matches = pattern.findall(str(soup))
         url = f'https://www.google.com/search?q={urllib.parse.quote(stock)}+site:businesstoday.in/stocks/&num=1&sca_esv=28795b6719ac1a08&sxsrf=ACQVn08xDA1EP1V6hJ-q4jLjjXSWWxgHTw:1711450545062&source=lnt&tbs=li:1&sa=X&ved=2ahUKEwj426eO4pGFAxX4n2MGHRXqBTUQpwV6BAgBEBM&biw=1280&bih=567&dpr=1.5'
         # logging.info("getting ticker stat url from: %s", url)
         # Fetch the HTML content of the webpage
+        html_content = requests.get(url,headers={'User-Agent': 'Mozilla/5.0'}).text  # Fix: Added .text to access the response text
         pattern = r'href="/url[?]q=(https://www.businesstoday.in/stocks/[^"]+)"'
         # Find all matches using re.findall
         links = re.findall(pattern, html_content)
         url = (links[0].split("&"))[0]
         # logging.info("Final URL to fetch stats %s" , url)
         # Fetch the HTML content of the webpage
+        html_content = requests.get(url,headers={'User-Agent': 'Mozilla/5.0'}).text
         soup = BeautifulSoup(html_content, "html.parser")
         script = soup.find("script", type="application/ld+json")
         url = f'https://www.google.com/search?q={urllib.parse.quote(stock)}+site:trendlyne.com/research-reports&num=3&sca_esv=28795b6719ac1a08&sxsrf=ACQVn08xDA1EP1V6hJ-q4jLjjXSWWxgHTw:1711450545062&source=lnt&tbs=li:1&sa=X&ved=2ahUKEwj426eO4pGFAxX4n2MGHRXqBTUQpwV6BAgBEBM&biw=1280&bih=567&dpr=1.5'
         # logging.info(url)
         # Fetch the HTML content of the webpage
+        html_content = requests.get(url,headers={'User-Agent': 'Mozilla/5.0'}).text  # Fix: Added .text to access the response text
         pattern = r'href="/url[?]q=(https://trendlyne.com/research-reports/[^"]+)"'
         # Find all matches using re.findall
         links = re.findall(pattern, html_content)