bilal-mustafa10 · sethupavan12 · Nov 16, 2022 · Nov 17, 2022 · Nov 17, 2022 · Nov 17, 2022
diff --git a/.gitignore b/.gitignore
@@ -1 +1,6 @@
-nlp_backend/assets/data.csv
+nlp_backend/assets/cleanedDF.csv
+nlp_backend/__pycache__/__init__.cpython-310.pyc
+nlp_backend/__pycache__/settings.cpython-310.pyc
+nlp_backend/__pycache__/views.cpython-310.pyc
+nlp_backend/__pycache__/wsgi.cpython-310.pyc
+nlp_backend/__pycache__/urls.cpython-310.pyc
diff --git a/nlp_backend/__init__.py b/nlp_backend/__init__.py
@@ -1,3 +1,17 @@
+
+# import pandas as pd
+# from ast import literal_eval
+# from tqdm.notebook import tqdm
+# tqdm.pandas()
+# from datetime import datetime
+# from transformers import pipeline
+
+
+# data_path = "../assets/cleanedDF.csv"
+# df = pd.read_csv(data_path, sep='\t', converters={'doc_entities': literal_eval, 'doc_keyphrases': literal_eval})
+# interesting = df.drop(['id','doc_date', 'doc_title', 'doc_url', 'doc_entities', 'doc_keyphrases', 'doc_publish_location'], axis=1)
+# model_name = "deepset/roberta-base-squad2"
+# fb_ai = pipeline('question-answering', model=model_name, tokenizer=model_name)
 from ast import literal_eval
 
 import pandas as pd
@@ -14,4 +28,5 @@
 interesting.dropna()
 interesting['sentence'] = interesting['sentence'].fillna('')
 model_name = "deepset/roberta-base-squad2"
-fb_ai = pipeline('question-answering', model=model_name, tokenizer=model_name)
+fb_ai = pipeline('question-answering', model=model_name, tokenizer=model_name)
+
diff --git a/nlp_backend/asgi.py b/nlp_backend/asgi.py
@@ -13,4 +13,5 @@
 
 os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'nlp_backend.settings')
 
+
 application = get_asgi_application()
diff --git a/nlp_backend/views.py b/nlp_backend/views.py
@@ -2,6 +2,9 @@
 
 import pandas as pd
 from django.http import HttpResponse
+from nlp_backend import interesting, fb_ai
+
+
 from django.views.decorators.csrf import csrf_exempt
 from transformers import pipeline
 
@@ -104,18 +107,36 @@ def get_continent_dist_for_a_snack(snack):
     africa = [" South Africa", ' Nigeria', ' Kenya', ' Ghana', ' Zimbabwe', ' Trinidad and Tobago', ' Rwanda',
               ' Uganda', ' Tanzania']
 
-    africa_total = 0
-    for i in north_america:
-        north_america_total += len(df[(df['sentence'].str.contains(snack)) & (df['sentence'].str.contains(i))])
-    for i in south_america:
-        south_america_total += len(df[(df['sentence'].str.contains(snack)) & (df['sentence'].str.contains(i))])
-    for i in europe:
-        europe_total += len(df[(df['sentence'].str.contains(snack)) & (df['sentence'].str.contains(i))])
-    for i in africa:
-        africa_total += len(df[(df['sentence'].str.contains(snack)) & (df['sentence'].str.contains(i))])
-    asia_total = len(df[(df['sentence'].str.contains(snack)) & (df['sentence'].str.contains(' Asia'))])
-    answer = north_america_total, south_america_total, europe_total, asia_total, africa_total
-    # scale the data to total to 1
-    # make sure the answers are split into percentages of the total so that they can be compared
-    percent = [i * 100 / sum(answer) for i in answer]
+
+
+def return_highest_snack_country(request,snack):
+    if request.method == 'GET':
+        country = find_snack_highest_talked_country(snack)
+        return HttpResponse(json.dumps(country), content_type='application/json')
+
+
+# Example topic: "Walnuts"
+# Example question: "What are some famous walnut types?"
+# Example answer: "Organic Walnuts and Organic Walnuts with Apple Cinnamon"
+def q_a_facebook(request, topic, question):
+    model_name = "deepset/roberta-base-squad2"
+    fb_ai = pipeline('question-answering', model=model_name, tokenizer=model_name)
+    sentences_topic = ' '.join(interesting[interesting['sentence'].str.contains(topic)]['sentence'])
+
+
+
+
+
+
+
+# Find the publish location (country) whose sentences mention the snack most often
+def find_snack_highest_talked_country(snack):
+  countries = {}
+  for country in df['doc_publish_location'].unique():
+      countries[country] = df[df['doc_publish_location'] == country]['sentence'].str.contains(snack).sum()
+
+  # Return the country with the highest mention count
+  return max(countries, key=countries.get)
+ * 100 / sum(answer) for i in answer]
     return percent
+
diff --git a/requirements.txt b/requirements.txt
@@ -0,0 +1,4 @@
+Django~=4.1.3
+transformers~=4.24.0
+pandas~=1.5.1
+tqdm~=4.64.1
Original file line number	Diff line number	Diff line change
Expand Up		@@ -13,4 +13,5 @@

		os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'nlp_backend.settings')


		application = get_asgi_application()