USGS批量下载站点日径流数据

殷玉领

已于 2024-04-24 21:57:42 修改

阅读量510

点赞数 4

文章标签： python

于 2024-04-24 21:50:27 首次发布

本文链接：https://blog.csdn.net/yinbaoshun/article/details/138170433

版权

1、下载代码

import requests
import os

def read_site_ids(file_path):
    """
    Reads a file containing site IDs and returns a list of IDs.

    :param file_path: The path to the file containing site IDs.
    :return: A list of site IDs.
    """
    site_ids = []
    with open(file_path, 'r') as file:
        for line in file:
            # Assuming the site IDs are in the second column, separated by whitespace
            parts = line.split()
            if parts and len(parts) > 1:
                try:
                    # Verify it's an 8-digit number before adding
                    site_id = int(parts[1])
                    if len(str(site_id)) == 8:
                        site_ids.append(str(site_id))
                except ValueError:
                    # If it's not a number, move to the next line
                    continue
    return site_ids

def construct_url(site_id):
    """
    Constructs the URL to download data for a given site ID.

    :param site_id: The site ID to construct the URL for.
    :return: The constructed URL.
    """
    base_url = 'https://waterdata.usgs.gov/nwis/dv'
    params = {
        'cb_00060': 'on',
        'format': 'rdb',
        'site_no': site_id,
        'legacy': '',
        'referred_module': 'sw',
        'period': '',
        'begin_date': '1980-01-01',
        'end_date': '2020-12-31'
    }
    # Construct the URL with query parameters
    query_string = '&'.join([f"{key}={value}" for key, value in params.items()])
    url = f"{base_url}?{query_string}"
    return url

def download_txt_file(url, filename, target_folder):
    """
    Downloads a text file from a given URL and saves it to a target folder.

    :param url: The URL to download the file from.
    :param filename: The name to save the file as.
    :param target_folder: The folder to save the file in.
    """
    import requests
    # Get the content from the URL
    response = requests.get(url, allow_redirects=True)
    if response.status_code == 200:
        # Save the content to a file in the target folder
        with open(f"{target_folder}/{filename}", 'wb') as f:
            f.write(response.content)
    else:
        print(f"Failed to download data for site {filename} - Status code: {response.status_code}")

# We will comment out the actual calls to these functions and provide them for execution on the user's local environment
# Assume we're reading from '/mnt/data/Sites_ID_USGS.txt'
file_path = 'E:/Dataset_2024/Sites_ID_USGS.txt'
site_ids = read_site_ids(file_path)
target_folder = 'E:/Dataset_2024/USGS/'  # Assume this is the target folder
# Uncomment the following code to perform the download (to be run by the user locally)

for site_id in site_ids:
    url = construct_url(site_id)
    download_txt_file(url, f"{site_id}.txt", target_folder)