Spaces:

engralimalik
/

hackathon_lace

Running

App Files Community

engralimalik committed on Jan 26

Commit

ffb3516

verified ·

1 Parent(s): 281c408

Update app.py

Browse files

Files changed (1) hide show

app.py +49 -28

app.py CHANGED Viewed

@@ -5,36 +5,48 @@ from folium.plugins import MarkerCluster
 import requests
 from io import BytesIO
-# Load data from Excel URL
 def load_data(url):
-    response = requests.get(url)
-    # Read the Excel file from the response content
-    lat_long_data = pd.read_excel(BytesIO(response.content), sheet_name="lat long", engine='openpyxl')
-    measurement_data = pd.read_excel(BytesIO(response.content), sheet_name="measurement data", engine='openpyxl')
-    # Merge data on school_id_giga
-    merged_data = pd.merge(
-        lat_long_data,
-        measurement_data,
-        left_on="school_id_giga",
-        right_on="school_id_giga",
-        how="inner"
-    )
-    # Strip any extra spaces from column names
-    merged_data.columns = merged_data.columns.str.strip()
-    return merged_data
 # Perform clustering to find data center location
 def find_data_center(df, n_clusters=1):
     kmeans = KMeans(n_clusters=n_clusters, random_state=0).fit(df[["latitude", "longitude"]])
     return kmeans.cluster_centers_
 # Plot the map with markers
 def plot_map(df, center):
-    # Print column names for debugging
-    print(df.columns)
     map = folium.Map(location=[center[0][0], center[0][1]], zoom_start=10)
     marker_cluster = MarkerCluster().add_to(map)
@@ -63,7 +75,9 @@ def plot_map(df, center):
 # Calculate the impact of data center on latency and bandwidth
 def calculate_impact(df, center):
-    # Calculate average latency and bandwidth before the data center
     avg_latency_before = df['latency'].mean()
     avg_download_before = df['download_speed'].mean()
     avg_upload_before = df['upload_speed'].mean()
@@ -98,20 +112,27 @@ def main():
     url = "https://huggingface.co/spaces/engralimalik/lace/resolve/main/data%20barbados.xlsx"  # URL of your Excel file
     df = load_data(url)
     # Find the data center location using clustering
     center = find_data_center(df)
     # Create the map and save it
     map = plot_map(df, center)
-    map.save("index.html")
     # Calculate the impact of adding the data center
     latency_reduction, download_increase, upload_increase, avg_latency_before, avg_download_before, avg_upload_before = calculate_impact(df, center)
-    # Display the impact
-    impact_data = display_impact(latency_reduction, download_increase, upload_increase, avg_latency_before, avg_download_before, avg_upload_before)
-    print("Impact of Data Center on Latency and Bandwidth:")
-    print(impact_data)
     print("Map has been saved as index.html.")

 import requests
 from io import BytesIO
+# Load data from Excel URL with error handling
 def load_data(url):
+    try:
+        print("Loading data from:", url)
+        response = requests.get(url)
+        if response.status_code == 200:
+            lat_long_data = pd.read_excel(BytesIO(response.content), sheet_name="lat long", engine='openpyxl')
+            measurement_data = pd.read_excel(BytesIO(response.content), sheet_name="measurement data", engine='openpyxl')
+            # Merge data on school_id_giga
+            merged_data = pd.merge(
+                lat_long_data,
+                measurement_data,
+                left_on="school_id_giga",
+                right_on="school_id_giga",
+                how="inner"
+            )
+            # Strip any extra spaces from column names
+            merged_data.columns = merged_data.columns.str.strip()
+            print("Data loaded successfully")
+            return merged_data
+        else:
+            print(f"Failed to load data. Status code: {response.status_code}")
+            return pd.DataFrame()
+    except Exception as e:
+        print(f"Error loading data: {e}")
+        return pd.DataFrame()
 # Perform clustering to find data center location
 def find_data_center(df, n_clusters=1):
+    if df.empty:
+        print("Dataframe is empty, skipping clustering")
+        return None
     kmeans = KMeans(n_clusters=n_clusters, random_state=0).fit(df[["latitude", "longitude"]])
     return kmeans.cluster_centers_
 # Plot the map with markers
 def plot_map(df, center):
+    if df.empty:
+        print("Dataframe is empty, skipping map plotting")
+        return None
     map = folium.Map(location=[center[0][0], center[0][1]], zoom_start=10)
     marker_cluster = MarkerCluster().add_to(map)
 # Calculate the impact of data center on latency and bandwidth
 def calculate_impact(df, center):
+    if df.empty:
+        print("Dataframe is empty, skipping impact calculation")
+        return None
     avg_latency_before = df['latency'].mean()
     avg_download_before = df['download_speed'].mean()
     avg_upload_before = df['upload_speed'].mean()
     url = "https://huggingface.co/spaces/engralimalik/lace/resolve/main/data%20barbados.xlsx"  # URL of your Excel file
     df = load_data(url)
+    if df.empty:
+        print("No data to process, exiting application.")
+        return
     # Find the data center location using clustering
     center = find_data_center(df)
+    if center is None:
+        print("Could not find data center, exiting application.")
+        return
     # Create the map and save it
     map = plot_map(df, center)
+    if map:
+        map.save("index.html")
     # Calculate the impact of adding the data center
     latency_reduction, download_increase, upload_increase, avg_latency_before, avg_download_before, avg_upload_before = calculate_impact(df, center)
+    if latency_reduction is not None:
+        impact_data = display_impact(latency_reduction, download_increase, upload_increase, avg_latency_before, avg_download_before, avg_upload_before)
+        print("Impact of Data Center on Latency and Bandwidth:")
+        print(impact_data)
     print("Map has been saved as index.html.")