Spaces:

rafaldembski
/

ScamDetector

Sleeping

App Files Community

rafaldembski committed on Oct 2

Commit

6f95eac

•

1 Parent(s): 9899a9d

Update utils/functions.py

Browse files

Files changed (1) hide show

utils/functions.py +99 -23

utils/functions.py CHANGED Viewed

@@ -29,7 +29,7 @@ def load_json(file_path):
     """Ładuje dane z pliku JSON. Jeśli plik nie istnieje, zwraca pustą listę lub domyślny obiekt."""
     if not os.path.exists(file_path):
         if file_path.endswith('stats.json'):
-            return {"total_analyses": 0, "total_frauds_detected": 0}
         else:
             return []
     with open(file_path, 'r', encoding='utf-8') as file:
@@ -39,7 +39,7 @@ def load_json(file_path):
         except json.JSONDecodeError:
             logging.error(f"Nie można załadować danych z {file_path}. Plik jest uszkodzony.")
             if file_path.endswith('stats.json'):
-                return {"total_analyses": 0, "total_frauds_detected": 0}
             return []
 def save_json(file_path, data):
@@ -77,6 +77,7 @@ def add_to_history(message, phone_number, analysis, risk, recommendations):
     history = load_json(HISTORY_FILE)
     history.append({
         "timestamp": datetime.now().isoformat(),
         "message": message,
         "phone_number": phone_number,
         "analysis": analysis,
@@ -105,10 +106,11 @@ def update_stats(fraud_detected=False):
     """Aktualizuje statystyki analiz w pliku stats.json."""
     stats = load_json(STATS_FILE)
     stats["total_analyses"] += 1
     if fraud_detected:
         stats["total_frauds_detected"] += 1
     save_json(STATS_FILE, stats)
-    logging.info(f"Statystyki zostały zaktualizowane: Analiz {stats['total_analyses']}, Oszustw {stats['total_frauds_detected']}.")
 def get_stats():
     """Pobiera statystyki analiz z pliku stats.json."""
@@ -125,8 +127,8 @@ def get_phone_info(phone_number):
     """Weryfikuje numer telefonu i zwraca informacje o kraju i operatorze."""
     try:
         parsed_number = phonenumbers.parse(phone_number, None)
-        country = geocoder.description_for_number(parsed_number, 'pl')
-        operator = carrier.name_for_number(parsed_number, 'pl')
         if not country:
             country = "Nieznany"
         if not operator:
@@ -163,7 +165,7 @@ def analyze_message(message, phone_number, additional_info, api_key, language):
         logging.error("Brak klucza API.")
         return "Brak klucza API.", "Brak klucza API.", "Brak klucza API."
-    url = "https://api.sambanova.ai/v1/chat/completions"
     headers = {
         "Authorization": f"Bearer {api_key}",
         "Content-Type": "application/json"
@@ -177,53 +179,126 @@ Jesteś zaawansowanym asystentem AI specjalizującym się w identyfikacji fałsz
 **📝 Analiza Treści Wiadomości:**
 - Przeprowadź szczegółową analizę treści wiadomości, identyfikując potencjalne czerwone flagi, takie jak błędy językowe, prośby o dane osobowe, pilne prośby o kontakt itp.
 - Jakie elementy treści mogą wskazywać na oszustwo?
 </analysis>
 <risk_assessment>
 **⚖️ Ocena Ryzyka Oszustwa:**
 - Na podstawie analizy treści i dostępnych informacji oceń prawdopodobieństwo, że wiadomość jest oszustwem. Użyj skali od 1 do 10, gdzie 1 oznacza bardzo niskie ryzyko, a 10 bardzo wysokie ryzyko.
 </risk_assessment>
 <recommendations>
 **💡 Zalecenia dla Użytkownika:**
 - Podaj jasne i konkretne zalecenia dotyczące dalszych kroków, które użytkownik powinien podjąć.
 </recommendations>
         """,
         'German': """
-Du bist ein fortgeschrittener KI-Assistent, spezialisiert auf die Identifizierung gefälschter SMS-Nachrichten. Deine Aufgabe ist es, eine detaillierte Analyse der Nachricht durchzuführen. Deine Antwort sollte in drei Abschnitte unterteilt sein:
 <analysis>
-**Nachrichteninhaltsanalyse:**
-- Führe eine detaillierte Analyse des Nachrichteninhalts durch und identifiziere potenzielle rote Flaggen.
 </analysis>
 <risk_assessment>
-**Betrugsrisikobewertung:**
-- Bewerte die Wahrscheinlichkeit, dass die Nachricht betrügerisch ist.
 </risk_assessment>
 <recommendations>
-**Empfehlungen für den Benutzer:**
-- Gib klare und spezifische Empfehlungen zu den nächsten Schritten.
 </recommendations>
         """,
         'English': """
-You are an advanced AI assistant specializing in identifying fake SMS messages. Your task is to conduct a detailed analysis of the message. Your response should be divided into three sections:
 <analysis>
-**Message Content Analysis:**
-- Conduct a detailed analysis of the message content and identify potential red flags.
 </analysis>
 <risk_assessment>
-**Fraud Risk Assessment:**
-- Assess the likelihood that the message is fraudulent.
 </risk_assessment>
 <recommendations>
-**User Recommendations:**
-- Provide clear and specific recommendations regarding the next steps the user should take.
 </recommendations>
         """
     }
@@ -240,7 +315,7 @@ Additional Information:
 Provide your analysis and conclusions following the guidelines above."""
     payload = {
-        "model": "Meta-Llama-3.1-8B-Instruct",
         "messages": [
             {"role": "system", "content": system_prompt},
             {"role": "user", "content": user_prompt}
@@ -355,8 +430,9 @@ def extract_text_from_image(image_file):
 def get_email_info(email):
     """Sprawdza informacje o nadawcy e-maila (np. domena, organizacja, kraj)."""
     domain = email.split('@')[-1]  # Prosta ekstrakcja domeny
     return {
         "domain": domain,
-        "organization": "Nieznana organizacja",
-        "country": "Nieznany kraj"
     }

     """Ładuje dane z pliku JSON. Jeśli plik nie istnieje, zwraca pustą listę lub domyślny obiekt."""
     if not os.path.exists(file_path):
         if file_path.endswith('stats.json'):
+            return {"total_analyses": 0, "total_frauds_detected": 0, "total": 0}  # Dodaj klucz 'total'
         else:
             return []
     with open(file_path, 'r', encoding='utf-8') as file:
         except json.JSONDecodeError:
             logging.error(f"Nie można załadować danych z {file_path}. Plik jest uszkodzony.")
             if file_path.endswith('stats.json'):
+                return {"total_analyses": 0, "total_frauds_detected": 0, "total": 0}  # Dodaj klucz 'total'
             return []
 def save_json(file_path, data):
     history = load_json(HISTORY_FILE)
     history.append({
         "timestamp": datetime.now().isoformat(),
+        "date": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),  # Dodaj klucz 'date'
         "message": message,
         "phone_number": phone_number,
         "analysis": analysis,
     """Aktualizuje statystyki analiz w pliku stats.json."""
     stats = load_json(STATS_FILE)
     stats["total_analyses"] += 1
+    stats["total"] += 1  # Dodajemy do całkowitej liczby analiz
     if fraud_detected:
         stats["total_frauds_detected"] += 1
     save_json(STATS_FILE, stats)
+    logging.info(f"Statystyki zostały zaktualizowane: Analiz {stats['total_analyses']}, Oszustw {stats['total_frauds_detected']}, Łącznie {stats['total']}.")
 def get_stats():
     """Pobiera statystyki analiz z pliku stats.json."""
     """Weryfikuje numer telefonu i zwraca informacje o kraju i operatorze."""
     try:
         parsed_number = phonenumbers.parse(phone_number, None)
+        country = geocoder.description_for_number(parsed_number, 'pl')  # Zmiana na 'pl' dla polskiego
+        operator = carrier.name_for_number(parsed_number, 'pl')  # Zmiana na 'pl' dla polskiego
         if not country:
             country = "Nieznany"
         if not operator:
         logging.error("Brak klucza API.")
         return "Brak klucza API.", "Brak klucza API.", "Brak klucza API."
+    url = "https://api.sambanova.ai/v1/chat/completions"  # Upewnij się, że to poprawny URL
     headers = {
         "Authorization": f"Bearer {api_key}",
         "Content-Type": "application/json"
 **📝 Analiza Treści Wiadomości:**
 - Przeprowadź szczegółową analizę treści wiadomości, identyfikując potencjalne czerwone flagi, takie jak błędy językowe, prośby o dane osobowe, pilne prośby o kontakt itp.
 - Jakie elementy treści mogą wskazywać na oszustwo?
+- Jakie słowa kluczowe są używane w wiadomości? (np. "pieniądze", "przelew", "nagroda")
+- Jakie są reakcje na tę wiadomość w kontekście kulturowym i językowym?
+**❓ Dodatkowe pytania do przemyślenia:**
+- Kiedy i jak często otrzymujesz wiadomości z tego numeru?
+- Czy numer nadawcy jest znany z innych źródeł?
+- Jakie są konsekwencje dla Ciebie, jeśli ta wiadomość jest oszustwem?
+- Jakie masz doświadczenia z podobnymi wiadomościami w przeszłości?
 </analysis>
 <risk_assessment>
 **⚖️ Ocena Ryzyka Oszustwa:**
 - Na podstawie analizy treści i dostępnych informacji oceń prawdopodobieństwo, że wiadomość jest oszustwem. Użyj skali od 1 do 10, gdzie 1 oznacza bardzo niskie ryzyko, a 10 bardzo wysokie ryzyko.
+- Jakie czynniki wpływają na tę ocenę?
+- Jakie są argumenty za i przeciw ocenie tej wiadomości jako oszustwa?
+**❓ Dodatkowe pytania do przemyślenia:**
+- Jakie inne wiadomości z tego numeru otrzymywałeś w przeszłości?
+- Czy wiadomość zawiera jakiekolwiek inne informacje, które mogłyby być użyteczne w ocenie ryzyka?
+- Jakie są Twoje dotychczasowe doświadczenia z oszustwami SMS?
+- Jakie są Twoje przemyślenia na temat nadawcy tej wiadomości?
 </risk_assessment>
 <recommendations>
 **💡 Zalecenia dla Użytkownika:**
 - Podaj jasne i konkretne zalecenia dotyczące dalszych kroków, które użytkownik powinien podjąć.
+- Jakie środki bezpieczeństwa powinny być wdrożone?
+**❓ Dodatkowe pytania do przemyślenia:**
+- Czy powinieneś zgłosić tę wiadomość do operatora sieci?
+- Jakie dodatkowe kroki możesz podjąć, aby upewnić się, że nie padłeś ofiarą oszustwa?
+- Czy masz dostęp do innych narzędzi, które mogą pomóc w ocenie tej wiadomości?
+- Jakie działania możesz podjąć, aby zwiększyć swoje bezpieczeństwo w przyszłości?
 </recommendations>
         """,
         'German': """
+Du bist ein fortgeschrittener KI-Assistent, spezialisiert auf die Identifizierung gefälschter SMS-Nachrichten. Deine Aufgabe ist es, eine detaillierte Analyse der Nachricht durchzuführen, indem du einen tiefgreifenden Denkprozess nutzt und eine umfassende Bewertung lieferst. Deine Antwort sollte in drei Abschnitte unterteilt sein:
 <analysis>
+**📝 Nachrichteninhaltsanalyse:**
+- Führe eine detaillierte Analyse des Nachrichteninhalts durch und identifiziere potenzielle rote Flaggen wie sprachliche Fehler, Aufforderungen zur Preisgabe persönlicher Daten, dringende Kontaktanfragen usw.
+- Welche Elemente im Inhalt könnten auf Betrug hinweisen?
+- Welche Schlüsselwörter werden in der Nachricht verwendet? (z. B. "Geld", "Überweisung", "Preis")
+- Wie reagieren die Menschen auf diese Nachricht im kulturellen und sprachlichen Kontext?
+**❓ Zusätzliche Fragen zur Überlegung:**
+- Wann und wie oft erhältst du Nachrichten von dieser Nummer?
+- Ist die Nummer des Absenders aus anderen Quellen bekannt?
+- Was sind die Konsequenzen für dich, wenn diese Nachricht ein Betrug ist?
+- Welche Erfahrungen hast du in der Vergangenheit mit ähnlichen Nachrichten gemacht?
 </analysis>
 <risk_assessment>
+**⚖️ Betrugsrisikobewertung:**
+- Bewerte die Wahrscheinlichkeit, dass die Nachricht betrügerisch ist, auf einer Skala von 1 bis 10, wobei 1 sehr geringes Risiko und 10 sehr hohes Risiko bedeutet.
+- Welche Faktoren beeinflussen diese Bewertung?
+- Was sind die Argumente für und gegen die Bewertung dieser Nachricht als Betrug?
+**❓ Zusätzliche Fragen zur Überlegung:**
+- Welche anderen Nachrichten hast du in der Vergangenheit von dieser Nummer erhalten?
+- Enthält die Nachricht weitere Informationen, die bei der Risikobewertung hilfreich sein könnten?
+- Welche bisherigen Erfahrungen hast du mit SMS-Betrügereien gemacht?
+- Welche Gedanken hast du über den Absender dieser Nachricht?
 </risk_assessment>
 <recommendations>
+**💡 Empfehlungen für den Benutzer:**
+- Gib klare und spezifische Empfehlungen zu den nächsten Schritten, die der Benutzer unternehmen sollte.
+- Welche Sicherheitsmaßnahmen sollten umgesetzt werden?
+**❓ Zusätzliche Fragen zur Überlegung:**
+- Solltest du diese Nachricht deinem Mobilfunkanbieter melden?
+- Welche weiteren Schritte kannst du unternehmen, um sicherzustellen, dass du nicht Opfer eines Betrugs geworden bist?
+- Hast du Zugriff auf andere Werkzeuge, die dir helfen können, diese Nachricht zu bewerten?
+- Welche Maßnahmen kannst du ergreifen, um deine Sicherheit in Zukunft zu erhöhen?
 </recommendations>
         """,
         'English': """
+You are an advanced AI assistant specializing in identifying fake SMS messages. Your task is to conduct a detailed analysis of the message, utilizing a deep thinking process and providing a comprehensive assessment. Your response should be divided into three sections:
 <analysis>
+**📝 Message Content Analysis:**
+- Conduct a detailed analysis of the message content, identifying potential red flags such as language errors, requests for personal information, urgent contact requests, etc.
+- What elements of the content may indicate fraud?
+- What keywords are used in the message? (e.g., "money", "transfer", "prize")
+- What are the cultural and linguistic reactions to this message?
+**❓ Additional questions to consider:**
+- When and how often do you receive messages from this number?
+- Is the sender's number known from other sources?
+- What are the consequences for you if this message is a fraud?
+- What experiences have you had in the past with similar messages?
 </analysis>
 <risk_assessment>
+**⚖️ Fraud Risk Assessment:**
+- Assess the likelihood that the message is fraudulent on a scale from 1 to 10, where 1 indicates very low risk and 10 indicates very high risk.
+- What factors influence this assessment?
+- What are the arguments for and against assessing this message as fraud?
+**❓ Additional questions to consider:**
+- What other messages have you received from this number in the past?
+- Does the message contain any other information that could be useful in assessing the risk?
+- What previous experiences do you have with SMS scams?
+- What are your thoughts on the sender of this message?
 </risk_assessment>
 <recommendations>
+**💡 User Recommendations:**
+- Provide clear and concrete recommendations regarding the next steps the user should take.
+- What security measures should be implemented?
+**❓ Additional questions to consider:**
+- Should you report this message to your service provider?
+- What additional steps can you take to ensure that you have not fallen victim to a scam?
+- Do you have access to other tools that can help you assess this message?
+- What actions can you take to enhance your security in the future?
 </recommendations>
+Your response should be formatted exactly as specified above, using the <analysis>, <risk_assessment>, and <recommendations> tags. Ensure that each section is thoroughly and comprehensively filled out.
         """
     }
 Provide your analysis and conclusions following the guidelines above."""
     payload = {
+        "model": "Meta-Llama-3.1-8B-Instruct",  # Upewnij się, że to poprawny model API
         "messages": [
             {"role": "system", "content": system_prompt},
             {"role": "user", "content": user_prompt}
 def get_email_info(email):
     """Sprawdza informacje o nadawcy e-maila (np. domena, organizacja, kraj)."""
     domain = email.split('@')[-1]  # Prosta ekstrakcja domeny
+    # Możesz dodać więcej logiki do weryfikacji domeny
     return {
         "domain": domain,
+        "organization": "Nieznana organizacja",  # Możesz dodać logikę, aby zidentyfikować organizację
+        "country": "Nieznany kraj"  # Możesz dodać logikę, aby zidentyfikować kraj
     }