init

2025-12-06 10:43:48 +08:00 · 2024-06-25 16:01:57 +08:00
commit 2137d41d0b
10 changed files with 1223 additions and 0 deletions
--- a/analyzer.py
+++ b/analyzer.py
@@ -0,0 +1,65 @@
+"""
+Analyzer Module
+
+This module provides functionality for analyzing data in the Starbucks Global Store Data Analysis Program.
+
+The Analyzer class contains methods for performing various analyses on the Starbucks store data,
+including calculating total stores, unique countries, and identifying top countries and cities.
+
+Classes:
+    Analyzer: A class containing methods for data analysis and result formatting.
+
+Dependencies:
+    pandas: For data manipulation and analysis.
+    typing: For type hinting.
+"""
+
+import pandas as pd
+from typing import Dict, Any
+
+class Analyzer:
+    """
+    A class for analyzing Starbucks store data.
+
+    This class provides methods to perform various analyses on the Starbucks store data
+    and format the results for presentation.
+
+    Methods:
+        analyze_data(df: pd.DataFrame) -> Dict[str, Any]:
+            Perform analysis on the given DataFrame and return the results.
+        format_analysis(analysis: Dict[str, Any]) -> str:
+            Format the analysis results into a human-readable string.
+    """
+
+    @staticmethod
+    def analyze_data(df: pd.DataFrame) -> Dict[str, Any]:
+        """
+        Perform analysis on the given DataFrame.
+
+        This method calculates various statistics from the Starbucks store data,
+        including total number of stores, number of countries, top country, and top city.
+
+        Args:
+            df (pd.DataFrame): The DataFrame containing the Starbucks store data.
+
+        Returns:
+            Dict[str, Any]: A dictionary containing the analysis results.
+                Keys include:
+                - 'total_stores': Total number of unique stores
+                - 'total_countries': Total number of unique countries
+                - 'top_country': Country with the most stores
+                - 'top_city': City with the most stores
+        """
+        return {
+            'total_stores': df['Store Number'].nunique(),
+            'total_countries': df['Country'].nunique(),
+            'top_country': df['Country'].value_counts().index[0],
+            'top_city': df['City'].value_counts().index[0]
+        }
+
+    @staticmethod
+    def format_analysis(analysis: Dict[str, Any]) -> str:
+        return (f"星巴克在全球共有 {analysis['total_stores']} 家店铺，"
+                f"分布在 {analysis['total_countries']} 个国家和地区，"
+                f"店铺数量最多的国家是 {analysis['top_country']}，"
+                f"城市是 {analysis['top_city']}。")