10个Python自动化日常任务实战脚本示例

2060 篇文章 51 订阅
789 篇文章 1 订阅

CSV文件数据清洗工具

import csv
def clean_csv(input_file, output_file):
    """Copy a CSV file, trimming surrounding whitespace from every cell.

    Args:
        input_file: Path of the UTF-8 encoded CSV file to read.
        output_file: Path of the UTF-8 encoded CSV file to write; an
            existing file is overwritten.
    """
    # newline='' leaves line-ending handling to the csv module.
    with open(input_file, mode='r', newline='', encoding='utf-8') as src:
        with open(output_file, mode='w', newline='', encoding='utf-8') as dst:
            csv_out = csv.writer(dst)
            # Cleaning step: strip leading/trailing whitespace per cell.
            csv_out.writerows(
                [value.strip() for value in record]
                for record in csv.reader(src)
            )
# Example usage: replace the placeholder paths with real files before running.
input_file = '/path/to/input.csv'
output_file = '/path/to/cleaned_output.csv'
# Write a whitespace-trimmed copy of input_file to output_file.
clean_csv(input_file, output_file)

文本文件翻译工具

from deep_translator import GoogleTranslator
def translate_text(input_file, output_file, target_language):
    """Translate the contents of a text file and save the result.

    The whole file is read as UTF-8, passed to GoogleTranslator with
    automatic source-language detection, and the translation is written
    as UTF-8 to ``output_file``.

    Args:
        input_file: Path of the text file to translate.
        output_file: Path the translated text is written to (overwritten).
        target_language: Language code handed to the translator as ``target``.
    """
    with open(input_file, 'r', encoding='utf-8') as source:
        original = source.read()

    translator = GoogleTranslator(source='auto', target=target_language)
    result = translator.translate(original)

    with open(output_file, 'w', encoding='utf-8') as sink:
        sink.write(result)
# Example usage: replace the placeholder paths with real files before running.
input_file = '/path/to/your/text.txt'
output_file = '/path/to/translated_text.txt'
target_language = 'es'  # Spanish
# Translate the contents of input_file and write the result to output_file.
translate_text(input_file, output_file, target_language)

文件夹内容同步工具

import shutil
import os
def sync_folders(src_folder, dst_folder):
    """Copy every entry of ``src_folder`` into ``dst_folder``.

    Sub-directories are copied recursively and merged into any existing
    directory of the same name; files are copied with their metadata and
    overwrite existing files. Entries that exist only in ``dst_folder``
    are left untouched (this is a one-way copy, nothing is deleted).

    Args:
        src_folder: Directory whose contents are copied.
        dst_folder: Directory that receives the copies; created if missing.

    Raises:
        FileNotFoundError: If ``src_folder`` does not exist.
    """
    # copy2 does not create missing parent directories, so make sure the
    # destination exists before copying plain files into it.
    os.makedirs(dst_folder, exist_ok=True)
    for item in os.listdir(src_folder):
        s = os.path.join(src_folder, item)
        d = os.path.join(dst_folder, item)
        if os.path.isdir(s):
            shutil.copytree(s, d, dirs_exist_ok=True)
        else:
            shutil.copy2(s, d)
# Example usage: replace the placeholder paths with real folders before running.
src_folder = '/path/to/source/folder'
dst_folder = '/path/to/destination/folder'
# Copy everything from src_folder into dst_folder.
sync_folders(src_folder, dst_folder)

数据备份到云存储服务

import boto3
def upload_to_s3(bucket_name, local_file_path, remote_file_path):
    """Upload a local file to an S3 bucket.

    Args:
        bucket_name: Name of the destination bucket.
        local_file_path: Path of the file on disk to upload.
        remote_file_path: Object key the file is stored under in the bucket.
    """
    client = boto3.client('s3')
    client.upload_file(
        Filename=local_file_path,
        Bucket=bucket_name,
        Key=remote_file_path,
    )
# Example usage: replace the placeholders with a real bucket, file and key.
bucket_name = 'your-bucket-name'
local_file_path = '/path/to/your/local/file'
remote_file_path = 'path/to/remote/file'
# Upload local_file_path to bucket_name under the key remote_file_path.
upload_to_s3(bucket_name, local_file_path, remote_file_path)

文件夹内容统计工具

import os
def count_files_and_dirs(directory):
    """Count all files and sub-directories below ``directory``, recursively.

    Args:
        directory: Root directory to walk.

    Returns:
        A ``(total_files, total_dirs)`` tuple. The root directory itself
        is not included in the directory count.
    """
    # One (file count, sub-directory count) pair per directory visited.
    per_level = [
        (len(filenames), len(subdirs))
        for _path, subdirs, filenames in os.walk(directory)
    ]
    total_files = sum(n_files for n_files, _ in per_level)
    total_dirs = sum(n_dirs for _, n_dirs in per_level)
    return total_files, total_dirs
# Example usage: replace the placeholder path with a real directory.
directory = '/path/to/your/directory'
# Walk the directory tree and report the totals.
files, dirs = count_files_and_dirs(directory)
print(f"Total files: {files}, Total directories: {dirs}")

文件类型分类工具

import os
def classify_files_by_type(directory):
    """Count the regular files directly inside ``directory`` per extension.

    Sub-directories are not descended into. Extensions keep their leading
    dot and original case; files without an extension are counted under
    the empty string.

    Args:
        directory: Directory whose immediate entries are inspected.

    Returns:
        A dict mapping each extension to the number of files that have it.
    """
    tally = {}
    for entry in os.listdir(directory):
        if not os.path.isfile(os.path.join(directory, entry)):
            continue
        _stem, suffix = os.path.splitext(entry)
        tally[suffix] = tally.get(suffix, 0) + 1
    return tally
# Example usage: replace the placeholder path with a real directory.
directory = '/path/to/your/directory'
file_types = classify_files_by_type(directory)
# Print one line per extension with the number of matching files.
for ext, count in file_types.items():
    print(f"Files with extension '{ext}': {count}")

图像文字识别(OCR)工具

from PIL import Image
from pytesseract import pytesseract
def image_to_text(image_path):
    """Extract text from an image file with Tesseract OCR.

    Args:
        image_path: Path of the image file to read.

    Returns:
        The string returned by ``pytesseract.image_to_string`` for the image.
    """
    # Open the image as a context manager so the underlying file handle is
    # closed as soon as OCR finishes instead of lingering until garbage
    # collection.
    with Image.open(image_path) as img:
        return pytesseract.image_to_string(img)
# Example usage: replace the placeholder path with a real image file.
image_path = '/path/to/your/image.png'
# Run OCR on the image and print the text that was found.
text = image_to_text(image_path)
print(f"Text from image: {text}")

视频转音频工具

from moviepy.editor import VideoFileClip
def convert_video_to_audio(video_path, audio_path):
    """Write the audio track of a video file to a separate audio file.

    Args:
        video_path: Path of the video file to read.
        audio_path: Path of the audio file to create.
    """
    clip = VideoFileClip(video_path)
    try:
        # NOTE(review): clip.audio is presumably None for a video without an
        # audio track, in which case this line raises AttributeError - confirm.
        clip.audio.write_audiofile(audio_path)
    finally:
        # Release the clip's reader resources even if the export fails.
        clip.close()
# Example usage: replace the placeholder paths with real files before running.
video_path = '/path/to/your/video.mp4'
audio_path = '/path/to/converted/audio.mp3'
# Write the audio track of video_path to audio_path.
convert_video_to_audio(video_path, audio_path)

从网页提取图片

import requests
from bs4 import BeautifulSoup
import os
def extract_images_from_webpage(url, output_dir, timeout=10):
    """Download the images referenced by ``<img>`` tags on a web page.

    Relative ``src`` values are resolved against ``url``. Only http(s)
    image URLs are fetched. Each image is saved in ``output_dir`` under the
    last segment of its URL path; images that share a name overwrite each
    other.

    Args:
        url: Address of the page to scan.
        output_dir: Directory the images are written to; created if missing.
        timeout: Seconds to wait for each HTTP request before giving up.

    Raises:
        requests.HTTPError: If the page itself returns an error status.
        requests.RequestException: On network failures or timeouts.
    """
    # Imported locally so the function does not depend on extra file-level
    # imports.
    from urllib.parse import urljoin, urlparse

    response = requests.get(url, timeout=timeout)
    # Fail loudly instead of scraping an error page.
    response.raise_for_status()
    soup = BeautifulSoup(response.text, 'html.parser')
    os.makedirs(output_dir, exist_ok=True)
    for index, image in enumerate(soup.find_all('img')):
        src = image.get('src')
        if not src:
            continue
        # Resolve relative and protocol-relative sources against the page URL.
        image_url = urljoin(url, src)
        parsed = urlparse(image_url)
        if parsed.scheme not in ('http', 'https'):
            # Skips data: URIs and other schemes that cannot be fetched.
            continue
        # Build the name from the URL path only, so query strings do not end
        # up in the filename; fall back to a generated name when the path
        # has no final segment.
        name = os.path.basename(parsed.path) or f'image_{index}'
        image_response = requests.get(image_url, timeout=timeout)
        if not image_response.ok:
            # Do not save an HTTP error body as if it were an image.
            continue
        with open(os.path.join(output_dir, name), 'wb') as f:
            f.write(image_response.content)
# Example usage: replace the URL and the placeholder output directory.
url = 'https://example.com'
output_dir = '/path/to/output/images'
# Download the images found on the page into output_dir.
extract_images_from_webpage(url, output_dir)

文本摘要生成工具

from transformers import pipeline
def generate_summary(text):
    """Summarize ``text`` with the transformers "summarization" pipeline.

    A new pipeline is created on every call. The summarizer is invoked with
    ``max_length=130``, ``min_length=30`` and sampling disabled.

    Args:
        text: The text to summarize.

    Returns:
        The ``summary_text`` field of the first result.
    """
    results = pipeline("summarization")(
        text,
        max_length=130,
        min_length=30,
        do_sample=False,
    )
    first = results[0]
    return first['summary_text']
# Example usage: summarize a short placeholder text and print the result.
text = """Lorem ipsum dolor sit amet, consectetur adipiscing elit. 
Sed non risus. Suspendisse lectus tortor, dignissim sit amet, adipiscing nec, ultricies sed, dolor."""
summary = generate_summary(text)
# The print call was fused onto the previous line (a syntax error); it must
# be a statement of its own.
print(f"Summary: {summary}")

最后: 下方这份完整的软件测试视频教程已经整理上传完成,需要的朋友们可以自行领取【保证100%免费】

在这里插入图片描述

软件测试面试文档

我们学习必然是为了找到高薪的工作,下面这些面试题是来自阿里、腾讯、字节等一线互联网大厂最新的面试资料,并且有字节大佬给出了权威的解答,刷完这一套面试资料相信大家都能找到满意的工作。

在这里插入图片描述

在这里插入图片描述

  • 1
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值