Corey Morris
committed on
Commit
·
25b87bf
1
Parent(s):
0a77c60
using URL as file name
Browse files
- details_data_processor.py +14 -15
details_data_processor.py
CHANGED
|
@@ -28,28 +28,27 @@ class DetailsDataProcessor:
|
|
| 28 |
matching_files.append(filename) # Append the matching filename to the list
|
| 29 |
return matching_files # Return the list of matching filenames
|
| 30 |
|
|
|
|
| 31 |
@staticmethod
|
| 32 |
-
def download_file(url,
|
| 33 |
-
#
|
| 34 |
-
|
| 35 |
-
error_count = 0
|
| 36 |
-
success_count = 0
|
| 37 |
-
# timestamp = datetime.now()
|
| 38 |
|
| 39 |
-
#
|
| 40 |
-
|
| 41 |
|
| 42 |
-
#
|
| 43 |
-
|
| 44 |
|
| 45 |
-
|
| 46 |
-
save_file_path = save_file_path + "_" + str(unique_id) + ".json"
|
| 47 |
|
|
|
|
|
|
|
| 48 |
try:
|
| 49 |
# Sending a GET request
|
| 50 |
r = requests.get(url, allow_redirects=True)
|
| 51 |
-
r.raise_for_status()
|
| 52 |
-
|
| 53 |
# Writing the content to the specified file
|
| 54 |
with open(save_file_path, 'wb') as file:
|
| 55 |
file.write(r.content)
|
|
@@ -63,8 +62,8 @@ class DetailsDataProcessor:
|
|
| 63 |
error_count += 1
|
| 64 |
except Exception as e:
|
| 65 |
error_count += 1
|
| 66 |
-
return error_count, success_count
|
| 67 |
|
|
|
|
| 68 |
|
| 69 |
|
| 70 |
@staticmethod
|
|
|
|
| 28 |
matching_files.append(filename) # Append the matching filename to the list
|
| 29 |
return matching_files # Return the list of matching filenames
|
| 30 |
|
| 31 |
+
|
| 32 |
@staticmethod
|
| 33 |
+
def download_file(url, directory='details_data'):
|
| 34 |
+
# Define the prefix to be removed from the URL
|
| 35 |
+
url_prefix = "https://huggingface.co/datasets/open-llm-leaderboard/details/resolve/main/"
|
|
|
|
|
|
|
|
|
|
| 36 |
|
| 37 |
+
# Remove the prefix from the URL
|
| 38 |
+
file_name_part = url.replace(url_prefix, '')
|
| 39 |
|
| 40 |
+
# Replace characters that don't play nice with file systems
|
| 41 |
+
safe_file_name = re.sub(r'[<>:"/\\|?*]', '_', file_name_part) # Replace with '_'
|
| 42 |
|
| 43 |
+
save_file_path = os.path.join(directory, safe_file_name)
|
|
|
|
| 44 |
|
| 45 |
+
error_count = 0
|
| 46 |
+
success_count = 0
|
| 47 |
try:
|
| 48 |
# Sending a GET request
|
| 49 |
r = requests.get(url, allow_redirects=True)
|
| 50 |
+
r.raise_for_status()
|
| 51 |
+
|
| 52 |
# Writing the content to the specified file
|
| 53 |
with open(save_file_path, 'wb') as file:
|
| 54 |
file.write(r.content)
|
|
|
|
| 62 |
error_count += 1
|
| 63 |
except Exception as e:
|
| 64 |
error_count += 1
|
|
|
|
| 65 |
|
| 66 |
+
return error_count, success_count
|
| 67 |
|
| 68 |
|
| 69 |
@staticmethod
|