根据网络热点生成文章

大概算是个副业推荐?按照前两天在坛里看到的帖子的逻辑,省略了数据库部分,直接让 GPT 给我写了一段代码,试用了一下能出文章,不过这文章有没有人看就见仁见智了。

import requests
import logging
from collections import Counter
import re
import json

# Configure logging: timestamped INFO-level messages (module-wide).
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')

# OpenAI-compatible API key and endpoint base URL.
# NOTE(review): placeholder values — replace with a real key and base URL before running.
api_key = 'sk-xxxxxx'
api_base = "https://gpt.com"

# Fetch trending-topic titles from the configured hot-list APIs.
def fetch_hot_topics():
    """Collect hot-topic titles from each source URL.

    Returns:
        list[str]: titles gathered from all sources. A source that fails
        (network error, bad status, non-JSON body) is logged and skipped,
        so the result may be partial or empty — it never raises.
    """
    urls = [
        'https://api.suxun.site/api/hotlist?id=douyin',
        'https://api.suxun.site/api/hotlist?id=weibo'
        # More sources can be appended here.
    ]
    hot_topics = []
    for url in urls:
        try:
            # Timeout keeps one slow/dead source from hanging the whole run.
            response = requests.get(url, timeout=10)
            response.raise_for_status()  # raise on 4xx/5xx
            topics = response.json().get('data', [])
            # Skip malformed entries instead of crashing on a missing 'title'.
            hot_topics.extend(topic['title'] for topic in topics if 'title' in topic)
        except (requests.RequestException, ValueError) as e:
            # ValueError also covers a non-JSON response body.
            logging.error(f"请求 {url} 失败: {e}")
    return hot_topics

# Normalize raw topic strings so near-duplicates compare equal downstream.
def preprocess_topics(topics):
    """Strip every non-word character from each topic and lowercase it."""
    cleaned = []
    for raw in topics:
        cleaned.append(re.sub(r'\W+', '', raw).lower())
    return cleaned

# Ask the LLM to group similar topics: similar ones comma-joined on one
# line, distinct ones on separate lines.
def merge_topics(topics):
    """Merge near-duplicate topics via the chat-completions API.

    Args:
        topics: list of normalized topic strings.

    Returns:
        list[str]: one merged group per line of the model's reply,
        or [] on any request/parse failure (logged, never raised).
    """
    headers = {
        'Content-Type': 'application/json',
        'Authorization': f'Bearer {api_key}',
    }
    data = {
        "model": "gpt-4-turbo",
        "messages": [
            {"role": "system", "content": "你是一个专业的文本处理助手。我将给你一些话题列表,请将相似的话题用,间隔后放在同一行,不同的话题换行"},
            {"role": "user", "content": f"我给出的话题是:\n{topics}\n"}
        ],
        "max_tokens": 8000
    }
    try:
        # Timeout so one stuck API call cannot stall the whole pipeline.
        response = requests.post(f"{api_base}/chat/completions", headers=headers, json=data, timeout=60)
        response.raise_for_status()  # raise on 4xx/5xx
        response_data = response.json()
        merged_topics = response_data['choices'][0]['message']['content'].split('\n')
        return merged_topics
    except requests.RequestException as e:
        # NOTE: with recent `requests`, a non-JSON body raises
        # requests.JSONDecodeError, which is also a RequestException and
        # lands here — "Expecting value: line 1 column 1" usually means the
        # endpoint returned an HTML error page (check api_base / api_key).
        logging.error(f"请求合并话题失败: {e}")
    except KeyError as e:
        logging.error(f"响应中缺少预期的字段: {e}")
    except json.JSONDecodeError as e:
        logging.error(f"JSON 解析错误: {e}")
    return []

# Pick the ten "hottest" merged lines; hotness is how many topics were
# merged into the line, measured by comma count (ASCII and fullwidth).
def get_top_10_topics(merged_topics):
    """Return the 10 lines with the most merged topics, spaces removed."""
    def hotness(line):
        # More commas on a line means more sources mentioned the topic.
        return line.count(',') + line.count(',')

    ranked = sorted(merged_topics, key=hotness, reverse=True)
    return [line.replace(' ', '') for line in ranked[:10]]

# Ask a search-capable model for recent news related to a topic.
def search_article(summary):
    """Fetch summaries of the 10 latest news items about *summary*.

    Args:
        summary: topic string to search for.

    Returns:
        str: the model's reply text, or the fallback string
        "无法获取新闻信息" on any failure (logged, never raised).
    """
    headers = {
        'Content-Type': 'application/json',
        'Authorization': f'Bearer {api_key}',
    }
    data = {
        "model": "kimi",
        "stream": False,
        "messages": [
            {"role": "system", "content": "你是一个专业的AI助手。"},
            {"role": "user", "content": f"搜索:\n{summary}\n相关的最新10条新闻,给出每条新闻的大致内容及其要点"}
        ],
        "max_tokens": 8000
    }
    try:
        # Timeout so one stuck API call cannot stall the whole pipeline.
        response = requests.post(f"{api_base}/chat/completions", headers=headers, json=data, timeout=60)
        response.raise_for_status()  # raise on 4xx/5xx
        response_data = response.json()
        return response_data['choices'][0]['message']['content'].strip()
    except requests.RequestException as e:
        logging.error(f"请求搜索新闻信息失败: {e}")
    except KeyError as e:
        logging.error(f"响应中缺少预期的字段: {e}")
    except json.JSONDecodeError as e:
        # Added for consistency with merge_topics: a bare non-JSON body
        # previously propagated out of this function uncaught.
        logging.error(f"JSON 解析错误: {e}")
    return "无法获取新闻信息"

# Turn collected news summaries into a finished article via the LLM.
def write_article(summary):
    """Generate a humorous, life-adjacent article from news content.

    Args:
        summary: news text produced by search_article.

    Returns:
        str: the generated article, or a fallback message string on any
        failure (logged, never raised). Previously the failure path
        returned a tuple while success returned str; it now always
        returns str (same text save_article would have written).
    """
    headers = {
        'Content-Type': 'application/json',
        'Authorization': f'Bearer {api_key}',
    }
    data = {
        "model": "gpt-4o",
        "messages": [
            {"role": "system", "content": "你是一个资深的自媒体创作者"},
            {"role": "user", "content": f"新闻内容:{summary} \n 根据新闻内容,写一篇贴近生活、幽默风趣的文章,内容包括标题、引言、正文和结论。"}
        ],
        "max_tokens": 8000
    }
    try:
        # Timeout so one stuck API call cannot stall the whole pipeline.
        response = requests.post(f"{api_base}/chat/completions", headers=headers, json=data, timeout=60)
        response.raise_for_status()  # raise on 4xx/5xx
        response_data = response.json()
        article = response_data['choices'][0]['message']['content'].strip()
        return article
    except requests.RequestException as e:
        logging.error(f"请求写文章失败: {e}")
    except KeyError as e:
        logging.error(f"响应中缺少预期的字段: {e}")
    except json.JSONDecodeError as e:
        # Added for consistency with merge_topics' error handling.
        logging.error(f"JSON 解析错误: {e}")
    # Single string (str, matching the success path's type); the text is
    # the space-joined form of the old tuple, so saved files are unchanged.
    return "无法生成文章 文章生成失败"

# Persist an article to <topic>.txt in the current working directory.
def save_article(topic, article):
    """Write *article* to a UTF-8 .txt file named after *topic*.

    Args:
        topic: topic string; non-alphanumeric characters are dropped to
            build a filesystem-safe filename.
        article: article text (str), or a tuple of parts that will be
            space-joined (legacy failure shape of write_article).

    Raises:
        TypeError: if *article* is neither str nor tuple.
    """
    valid_topic = ''.join(ch for ch in topic if ch.isalnum())
    # A topic made only of punctuation/spaces would yield the hidden-ish
    # filename ".txt"; fall back to a fixed name instead.
    filename = f'{valid_topic or "untitled"}.txt'

    if isinstance(article, str):
        content = article
    elif isinstance(article, tuple):
        content = ' '.join(str(item) for item in article)
    else:
        raise TypeError("Unsupported type for article")

    with open(filename, 'w', encoding='utf-8') as file:
        file.write(content)

# Full pipeline: fetch → normalize → merge → rank → search → write → save.
def run_once():
    """Run the whole generation pipeline once, saving one article per topic."""
    raw_titles = fetch_hot_topics()
    normalized = preprocess_topics(raw_titles)
    merged = merge_topics(normalized)
    for topic in get_top_10_topics(merged):
        news_digest = search_article(topic)
        article = write_article(news_digest)
        save_article(topic, article)
        print(f"已生成文章并保存为 {topic}.txt")

# Run once when executed as a script; the guard keeps importing this
# module free of side effects (the unguarded call ran on import).
if __name__ == "__main__":
    run_once()

效果如下


17 个赞

感谢,为什么在深海

1 个赞

不晓得放哪就随便放一下 :rofl:

1 个赞

深海软件分享

看着挺有意思的

感谢分享!

感谢分享

这个想法不错,不过gpt用中文输出的文案感觉并不是特别好

这个东西现在要搞的话,你得多账号走量,提示词也要再优化,我就是根据佬友的例子做了个demo

1 个赞

确实,如果不去专门搞prompt的话,感觉一般AI产出的内容并没有特别强的IP属性,至少目前走量可能是相对合理的解法

感谢分享

1 个赞

写得风格有点人机 不过稍微调整一下就可以了

感谢分享

问题是,投到哪里能赚钱呢

卖教程啊,现在都是赚想赚钱的人的钱

学到了 还能这样

为什么会出现2024-08-05 13:36:57,992 - ERROR - 请求合并话题失败: Expecting value: line 1 column 1 (char 0)啊

你得用自己的key 啊…

我用了

那你的走调试自己看看了,我这边是正常的