├── .dockerignore ├── .env ├── .gitignore ├── Dockerfile ├── LICENSE ├── LearnSpider ├── __init__.py ├── asgi.py ├── local_settings.py ├── settings.py ├── urls.py ├── views.py └── wsgi.py ├── README.md ├── api ├── __init__.py ├── admin.py ├── apps.py ├── migrations │ └── __init__.py ├── models.py ├── tests.py ├── urls.py └── views.py ├── collect_data ├── __init__.py ├── collect_news.py ├── collect_news_binance.py └── collect_news_block_beats.py ├── docker-compose.yml ├── docs └── 开发者文档.md ├── learn_spider-2025-02-27.sql ├── logs ├── django_debug.log └── django_error.log ├── manage.py ├── requirements.txt ├── spider_demo └── demo │ ├── demo │ ├── __init__.py │ ├── items.py │ ├── middlewares.py │ ├── pipelines.py │ ├── settings.py │ └── spiders │ │ ├── __init__.py │ │ ├── hello_scrapy.py │ │ ├── parse_demo.py │ │ └── post_spider.py │ ├── output.json │ └── scrapy.cfg ├── static ├── bootstrap │ ├── bootstrap-icons.css │ ├── bootstrap-icons.woff │ ├── bootstrap-icons.woff2 │ ├── bootstrap.bundle.min.js │ └── bootstrap.min.css ├── imgs │ ├── 404.svg │ ├── favicon.ico │ ├── friends │ │ ├── learnspider_logo.png │ │ └── stardream_logo.png │ ├── logo-img.svg │ ├── logo.jpeg │ ├── logo.svg │ ├── sandbox │ │ ├── blog.jpeg │ │ ├── music.jpeg │ │ ├── news.jpeg │ │ ├── shop.jpeg │ │ ├── video.jpeg │ │ └── wallpaper.jpeg │ ├── setu │ │ ├── 1.jpg │ │ ├── 1.png │ │ ├── 2.jpg │ │ ├── 2.png │ │ ├── 3.jpg │ │ └── 3.png │ ├── sponsors │ │ ├── evolution_host.png │ │ ├── lky_logo.png │ │ ├── qgwl_logo.png │ │ └── yrx_logo.png │ └── support │ │ ├── lky.png │ │ ├── wx.jpg │ │ ├── yrx.png │ │ └── zfb.jpg └── js │ ├── cpython666.js │ ├── jquery-3.7.1.min.js │ └── popper.min.js ├── tasks.py ├── test ├── demo.py └── dp.py └── topics ├── __init__.py ├── admin.py ├── apps.py ├── decorators.py ├── management ├── __init__.py └── commands │ ├── __init__.py │ ├── fetch_news_data.py │ ├── fetch_news_web3.py │ ├── update_category.py │ ├── update_difficulty_scores.py │ ├── update_order_ids.py │ └── 
update_pass_status.py ├── migrations ├── 0001_initial.py ├── 0002_web3newstag.py ├── 0003_web3news_web3newstag_tag_id_alter_web3newstag_name_and_more.py └── __init__.py ├── models.py ├── scheduler.py ├── serializers.py ├── static └── topics │ └── css │ └── style.css ├── tasks.py ├── templates └── topics │ ├── 404.html │ ├── base.html │ ├── demo.html │ ├── header.html │ ├── index │ ├── index.html │ ├── list.html │ ├── sandbox.html │ ├── shorthand.html │ └── tools.html │ ├── pages │ ├── 111.html │ ├── 112.html │ ├── ajax.html │ ├── asyncio.html │ ├── course-buying-guide.html │ ├── css-sprite.html │ ├── demo.html │ ├── demo_get_server_time.html │ ├── devtools.html │ ├── easy-spider.html │ ├── h1-6.html │ ├── hello-get.html │ ├── hello-post-form.html │ ├── hello-post-json.html │ ├── intro.html │ ├── lsp-spider.html │ ├── news.html │ ├── pagination-1.html │ ├── pagination-2.html │ ├── pagination-table.html │ ├── redirect.html │ ├── rowspan-table.html │ ├── spider-guide.html │ ├── spider-roadmap.html │ ├── svg.html │ ├── table-key-value.html │ └── wenjuan.html │ ├── sandbox │ ├── news │ │ ├── about_us.html │ │ ├── category.html │ │ ├── detail_category.html │ │ ├── detail_news.html │ │ ├── detail_source.html │ │ ├── news_base.html │ │ ├── news_header.html │ │ ├── news_hot.html │ │ ├── news_hot_detail.html │ │ ├── news_index.html │ │ ├── notice.html │ │ ├── technology.html │ │ └── web3.html │ └── wallpaper │ │ ├── wallpaper.html │ │ ├── wallpaper_base.html │ │ └── wallpaper_header.html │ ├── solutions.html │ ├── tools │ └── encode.html │ └── views │ ├── encode.html │ ├── hello-spider.html │ ├── request-twice-cookie.html │ ├── request-twice.html │ ├── table.html │ └── ua.html ├── tests.py ├── urls.py └── views.py /.dockerignore: -------------------------------------------------------------------------------- 1 | .git 2 | .DS_Store 3 | .idea 4 | .env 5 | /static_root 6 | docs 7 | spider_demo 8 | __pycache__ 
-------------------------------------------------------------------------------- /.env: -------------------------------------------------------------------------------- 1 | DJANGO_ENV=local -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | .idea 2 | staticfiles 3 | __pycache__/ 4 | *.pyc 5 | .DS_Store 6 | /static/bootstrap/bootstrap-icons-1.11.3/ 7 | /static/bootstrap/bootstrap-icons-1.11.3.zip 8 | bigsetu 9 | LearnSpider/secret_settings.py 10 | static_root -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- 1 | # 选择基础镜像 2 | #FROM python:3.11 3 | FROM python:3.11-slim 4 | # 设置工作目录 5 | WORKDIR /app 6 | 7 | # 更新pip到最新版本 8 | RUN pip install --upgrade pip 9 | 10 | # 复制项目文件 11 | COPY . . 12 | # 安装依赖 13 | RUN pip install --no-cache-dir -r requirements.txt -i https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple 14 | 15 | # 指定运行命令 16 | CMD ["python", "manage.py", "runserver", "0.0.0.0:8001"] -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2024 CodeFly 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 
14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /LearnSpider/__init__.py: -------------------------------------------------------------------------------- 1 | import pymysql 2 | 3 | pymysql.install_as_MySQLdb() 4 | -------------------------------------------------------------------------------- /LearnSpider/asgi.py: -------------------------------------------------------------------------------- 1 | """ 2 | ASGI config for LearnSpider project. 3 | 4 | It exposes the ASGI callable as a module-level variable named ``application``. 
5 | 6 | For more information on this file, see 7 | https://docs.djangoproject.com/en/5.0/howto/deployment/asgi/ 8 | """ 9 | 10 | import os 11 | 12 | from django.core.asgi import get_asgi_application 13 | 14 | os.environ.setdefault("DJANGO_SETTINGS_MODULE", "LearnSpider.settings") 15 | 16 | application = get_asgi_application() 17 | -------------------------------------------------------------------------------- /LearnSpider/local_settings.py: -------------------------------------------------------------------------------- 1 | SECRET_KEY = "your-secret-key" 2 | # settings 3 | # 多语言配置更改语言为中文 4 | LANGUAGE_CODE = "zh-hans" 5 | # 时区 6 | TIME_ZONE = "Asia/Shanghai" 7 | USE_TZ = True 8 | APPEND_SLASH = True 9 | 10 | SITE_URL = "http://learnspider.vip" 11 | 12 | CORS_ALLOWED_ORIGINS = [ 13 | "http://localhost:63342", # 允许的前端地址 14 | "http://localhost:8005", # 允许的前端地址(如果有必要) 15 | "http://localhost:5173", # 允许的前端地址(如果有必要) 16 | "http://localhost:4173", # 允许的前端地址(如果有必要) 17 | "http://localhost:4000", # 允许的前端地址(如果有必要) 18 | "http://www.learnspider.vip", 19 | "http://learnspider.vip", 20 | "http://localhost", 21 | "http://127.0.0.1", 22 | ] 23 | ALLOWED_HOSTS = [ 24 | "www.learnspider.vip", 25 | "learnspider.vip", 26 | "127.0.0.1", 27 | "localhost", 28 | "110.42.101.196", 29 | ] 30 | 31 | # 本地mysql 32 | # DATABASES = { 33 | # "default": { 34 | # "ENGINE": "django.db.backends.mysql", 35 | # "NAME": "learn_spider", 36 | # "HOST": "127.0.0.1", 37 | # "PORT": 3306, 38 | # "USER": "root", 39 | # "PASSWORD": "1234", 40 | # } 41 | # } 42 | -------------------------------------------------------------------------------- /LearnSpider/settings.py: -------------------------------------------------------------------------------- 1 | """ 2 | Django settings for LearnSpider project. 3 | 4 | Generated by 'django-admin startproject' using Django 5.0.7. 
5 | 6 | For more information on this file, see 7 | https://docs.djangoproject.com/en/5.0/topics/settings/ 8 | 9 | For the full list of settings and their values, see 10 | https://docs.djangoproject.com/en/5.0/ref/settings/ 11 | """ 12 | 13 | from pathlib import Path 14 | 15 | # Build paths inside the project like this: BASE_DIR / 'subdir'. 16 | BASE_DIR = Path(__file__).resolve().parent.parent 17 | 18 | # Quick-start development settings - unsuitable for production 19 | # See https://docs.djangoproject.com/en/5.0/howto/deployment/checklist/ 20 | 21 | # SECURITY WARNING: keep the secret key used in production secret! 22 | SECRET_KEY = "django-insecure-3$@35gg*j)v%o)*82^1n-x7eh!iq22!y3#g@gr35=3hazt)=!g" 23 | 24 | # SECURITY WARNING: don't run with debug turned on in production! 25 | # Application definition 26 | 27 | INSTALLED_APPS = [ 28 | "django.contrib.admin", 29 | "django.contrib.auth", 30 | "django.contrib.contenttypes", 31 | "django.contrib.sessions", 32 | "django.contrib.messages", 33 | "django.contrib.staticfiles", 34 | "rest_framework", 35 | "topics", 36 | "api", 37 | ] 38 | 39 | MIDDLEWARE = [ 40 | "django.middleware.security.SecurityMiddleware", 41 | "django.contrib.sessions.middleware.SessionMiddleware", 42 | "django.middleware.common.CommonMiddleware", 43 | "django.middleware.csrf.CsrfViewMiddleware", 44 | "django.contrib.auth.middleware.AuthenticationMiddleware", 45 | "django.contrib.messages.middleware.MessageMiddleware", 46 | "django.middleware.clickjacking.XFrameOptionsMiddleware", 47 | ] 48 | 49 | ROOT_URLCONF = "LearnSpider.urls" 50 | 51 | TEMPLATES = [ 52 | { 53 | "BACKEND": "django.template.backends.django.DjangoTemplates", 54 | "DIRS": [], 55 | "APP_DIRS": True, 56 | "OPTIONS": { 57 | "context_processors": [ 58 | "django.template.context_processors.debug", 59 | "django.template.context_processors.request", 60 | "django.contrib.auth.context_processors.auth", 61 | "django.contrib.messages.context_processors.messages", 62 | ], 63 | }, 64 | }, 65 | 
] 66 | 67 | WSGI_APPLICATION = "LearnSpider.wsgi.application" 68 | 69 | # Database 70 | # https://docs.djangoproject.com/en/5.0/ref/settings/#databases 71 | 72 | DATABASES = { 73 | "default": { 74 | "ENGINE": "django.db.backends.sqlite3", 75 | "NAME": BASE_DIR / "db.sqlite3", 76 | } 77 | } 78 | 79 | # Password validation 80 | # https://docs.djangoproject.com/en/5.0/ref/settings/#auth-password-validators 81 | 82 | AUTH_PASSWORD_VALIDATORS = [ 83 | { 84 | "NAME": "django.contrib.auth.password_validation.UserAttributeSimilarityValidator", 85 | }, 86 | { 87 | "NAME": "django.contrib.auth.password_validation.MinimumLengthValidator", 88 | }, 89 | { 90 | "NAME": "django.contrib.auth.password_validation.CommonPasswordValidator", 91 | }, 92 | { 93 | "NAME": "django.contrib.auth.password_validation.NumericPasswordValidator", 94 | }, 95 | ] 96 | 97 | # Internationalization 98 | # https://docs.djangoproject.com/en/5.0/topics/i18n/ 99 | 100 | 101 | USE_I18N = True 102 | TIME_ZONE = "Asia/Shanghai" 103 | USE_TZ = True 104 | 105 | LANGUAGE_CODE = "zh-Hans" 106 | # Static files (CSS, JavaScript, Images) 107 | # https://docs.djangoproject.com/en/5.0/howto/static-files/ 108 | 109 | STATIC_URL = "static/" 110 | STATICFILES_DIRS = [ 111 | BASE_DIR / "static", 112 | ] 113 | import os 114 | 115 | STATIC_ROOT = os.path.join(BASE_DIR, "static_root") 116 | # Default primary key field type 117 | # https://docs.djangoproject.com/en/5.0/ref/settings/#default-auto-field 118 | 119 | DEFAULT_AUTO_FIELD = "django.db.models.BigAutoField" 120 | 121 | DEBUG = True 122 | # DEBUG = False 123 | ALLOWED_HOSTS = [ 124 | "www.stardream.vip", 125 | "stardream.vip", 126 | "0.0.0.0", 127 | "127.0.0.1", 128 | "localhost", 129 | ] 130 | 131 | # PORT=8001 132 | topics_path_prefix = "topic/" 133 | 134 | # settings.py 的末尾添加以下代码 135 | 136 | try: 137 | from .local_settings import * 138 | from .secret_settings import * 139 | except ImportError as e: 140 | print(e) 141 | pass 142 | 143 | from dotenv import 
load_dotenv 144 | # 定义日志目录 145 | BASE_DIR = os.path.dirname(os.path.dirname(os.path.abspath(__file__))) 146 | LOG_DIR = os.path.join(BASE_DIR, "logs") 147 | 148 | # 如果日志目录不存在,则创建 149 | if not os.path.exists(LOG_DIR): 150 | os.makedirs(LOG_DIR) 151 | load_dotenv() 152 | DJANGO_ENV = os.getenv("DJANGO_ENV") 153 | if DJANGO_ENV == "local": 154 | DEBUG = True 155 | else: 156 | DEBUG = False 157 | 158 | LOGGING = { 159 | "version": 1, 160 | "disable_existing_loggers": False, 161 | "formatters": { 162 | "verbose": { 163 | "format": "[%(asctime)s] %(message)s", 164 | "datefmt": "%d/%b/%Y %H:%M:%S", 165 | }, 166 | }, 167 | "handlers": { 168 | "debug_file": { 169 | "level": "DEBUG", 170 | "class": "logging.FileHandler", 171 | "filename": os.path.join(LOG_DIR, "django_debug.log"), 172 | "formatter": "verbose", 173 | }, 174 | "error_file": { 175 | "level": "ERROR", 176 | "class": "logging.FileHandler", 177 | "filename": os.path.join(LOG_DIR, "django_error.log"), 178 | "formatter": "verbose", 179 | }, 180 | }, 181 | "loggers": { 182 | "django": { 183 | "handlers": ["debug_file", "error_file"], 184 | "level": "DEBUG", 185 | "propagate": True, 186 | }, 187 | }, 188 | } 189 | print("DEBUG",DEBUG) 190 | -------------------------------------------------------------------------------- /LearnSpider/urls.py: -------------------------------------------------------------------------------- 1 | from django.contrib import admin 2 | from django.urls import include, path, re_path 3 | from django.views.static import serve 4 | from LearnSpider.settings import STATIC_ROOT 5 | 6 | # https://www.cnblogs.com/ddb1-1/p/12455147.html 7 | urlpatterns = [ 8 | path("admin/", admin.site.urls), 9 | path("", include("topics.urls")), 10 | path("", include("api.urls")), 11 | ] 12 | # re_path(r'^static/(?P.*)$', serve, {'document_root': STATIC_ROOT}),#static文件 13 | # 在项目根目录的 urls.py 中定义全局404处理 14 | from topics.views import error404 15 | from django.conf.urls import handler404 16 | 17 | handler404 = error404 
18 | -------------------------------------------------------------------------------- /LearnSpider/views.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/LearnSpider/views.py -------------------------------------------------------------------------------- /LearnSpider/wsgi.py: -------------------------------------------------------------------------------- 1 | """ 2 | WSGI config for LearnSpider project. 3 | 4 | It exposes the WSGI callable as a module-level variable named ``application``. 5 | 6 | For more information on this file, see 7 | https://docs.djangoproject.com/en/5.0/howto/deployment/wsgi/ 8 | """ 9 | 10 | import os 11 | 12 | from django.core.wsgi import get_wsgi_application 13 | 14 | os.environ.setdefault("DJANGO_SETTINGS_MODULE", "LearnSpider.settings") 15 | 16 | application = get_wsgi_application() 17 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 |

爬虫百战成神 (LearnSpider)

2 |

3 | 4 | StarDreamSpider 5 | 6 |

7 |

来一场爬虫与成神相结合的旅行吧!

8 | 9 | ## 项目介绍 10 | 11 | 爬虫百战成神(LearnSpider)是一个面向初学者到高级用户的爬虫练习网站。我们提供了多种技术示例代码、详细的文档讲解和视频演示,帮助用户从零开始学习并掌握爬虫技术。 12 | 13 | ## 详细介绍 14 | 15 | 这是一个使用django+drf做一个爬虫刷题网站,也就是一个靶场,我创建这个项目的代码仓库名为LearnSpider,中文叫:爬虫百战成神。 16 | 17 | 它不仅是一个练习场,也配套有每道题目的多种技术示例代码,文档讲解,视频演示。题目由易到难,由浅入深,想让大家在刷题与实践的过程中甚至是从零学会爬虫(因为思想学会后,剩下的代码其实就是工具的使用),在这个过程中增加自己对于代码和场景的理解。本项目目标覆盖爬虫初级,进阶和高级。涉及到requests,scrapy这些请求工具,还有selenium,drissionpage这些自动化工具框架。涉及到接口请求,静态页面解析,也涉及到代码混淆,接口加密,也包含各种抓包工具的使用,chrome开发者工具的使用等。包括一些新颖的反爬技术,比如前端层面的反爬,svg反爬,css反爬,雪碧图等,也比如新兴的反爬技术比如wasm,总之就是我会什么,就像教大家什么。所以此仓库的内容也会无限拓展。也欢迎大家的贡献。 18 | 19 | 此仓库旨在让大家在刷题的过程中以结果和成就感驱动学习,学习到某个知识点后可以快速应用,从而感受到学到了东西,爬虫是如此的简单有趣。而不是学完之后因为网站内容变动而没有刷题的地方,久而久之像没学一样。并且本项目最想让大家养成举一反三,逻辑推理的思考思维习惯。 20 | 21 | 搭建此项目使用的技术栈是Django+DRF+JQuery。使用django的模板语法实现前端,使用jquery实现页面js逻辑与请求,drf实现请求限流。数据库使用sqlite。前端样式实现使用的bootstrap,本来想着手搓的,后面做的时候有感觉没必要给自己增加无意义的工作量。 22 | 23 | ### TODO 24 | 25 | - docker部署(我的mac好像连接不上docker的网络,暂时搁置等后面再说) 26 | - 用户系统 27 | 28 | ### 项目目标 29 | 30 | - **覆盖范围**:从初级到高级的爬虫技术 31 | - **工具与框架**:requests、scrapy、selenium、drissionpage等 32 | - **技术点**: 33 | - 接口请求与静态页面解析 34 | - 代码混淆与接口加密 35 | - 各种抓包工具与Chrome开发者工具使用 36 | - 新颖的反爬技术(前端层面、SVG、CSS、雪碧图、WASM等) 37 | 38 | ### 项目特色 39 | 40 | 1. **全面覆盖**:包含从入门到高级的各类爬虫技术与工具使用。 41 | 2. **示例丰富**:每道题目提供多种技术示例代码。 42 | 3. **详细讲解**:文档与视频讲解,帮助理解每个技术点。 43 | 4. **持续更新**:内容会随着新技术的出现不断扩展。 44 | 5. 
**社区贡献**:欢迎大家贡献自己的题目和解法。 45 | 46 | ### 学习方式 47 | 48 | - 通过刷题和实践,从零开始学习爬虫技术。 49 | - 以结果和成就感驱动学习,快速应用所学知识。 50 | - 培养举一反三和逻辑推理的思维习惯。 51 | 52 | ## 账号密码 53 | 54 | LearnSpider 55 | LearnSpider (线上密码已被更改) 56 | 邮箱:cpython666@gmail.com 57 | 58 | ## 技术栈 59 | 60 | - 后端框架:Django + Django REST Framework (DRF) 61 | - 前端:使用Django模板语法 62 | 63 | ## 项目结构 64 | 65 | ```plaintext 66 | LearnSpider/ 67 | ├── backend/ # 后端代码 68 | ├── frontend/ # 前端代码 69 | ├── templates/ # Django 模板文件 70 | ├── static/ # 静态文件 71 | ├── docs/ # 项目文档 72 | ├── videos/ # 视频演示 73 | └── README.md # 项目说明 74 | ``` 75 | 76 | ## 安装与运行 77 | 78 | ### 环境要求 79 | 80 | - Python 3.11+ 81 | - Django 4.2+ 82 | - Django REST Framework 83 | 84 | ### 安装步骤 85 | 86 | 1. 克隆项目代码: 87 | 88 | ```bash 89 | git clone https://github.com/cpython666/LearnSpider.git 90 | cd LearnSpider 91 | ``` 92 | 93 | 2. 创建并激活虚拟环境: 94 | 95 | ```bash 96 | python -m venv venv 97 | source venv/bin/activate # 对于Windows用户:venv\Scripts\activate 98 | ``` 99 | 100 | 3. 安装依赖: 101 | 102 | ```bash 103 | pip install -r requirements.txt 104 | ``` 105 | 106 | 4. 导入数据到mysql,修改数据库连接配置!!!!!!!!!! 107 | 108 | 5. 运行数据库迁移: 109 | 110 | ```bash 111 | python manage.py migrate 112 | ``` 113 | 114 | 6. 【可选】收集静态文件。 115 | 116 | 线上运行的时候用nginx代理静态文件; 117 | 118 | 本地运行的时候确保debug为true,否则访问不到静态资源 119 | 120 | ``` 121 | python manage.py collectstatic --noinput 122 | ``` 123 | 124 | 125 | 126 | 1. 启动开发服务器: 127 | 128 | ```bash 129 | python manage.py runserver 130 | ``` 131 | 132 | 2. 在浏览器中打开 `http://127.0.0.1:8000` 查看项目。 133 | 134 | ### docker部署 135 | 136 | 环境:windows+dockerdesktop 137 | 启动命令 138 | 139 | ```bash 140 | docker build -t learn-spider-app . 141 | ``` 142 | 143 | ```bash 144 | docker run -d -p 80:8000 learn-spider-app 145 | ``` 146 | 147 | ```bash 148 | docker compose up -d 149 | ``` 150 | 151 | ## 贡献指南 152 | 153 | 1. Fork 本仓库 154 | 2. 创建一个新的分支 (`git checkout -b feature/你的特性`) 155 | 3. 提交你的更改 (`git commit -am '添加了新的功能'`) 156 | 4. 推送到分支 (`git push origin feature/你的特性`) 157 | 5. 
创建一个新的 Pull Request 158 | 159 | ## 联系我们 160 | 161 | 如有任何问题或建议,请通过以下方式联系我们: 162 | 163 | - Email: 你的邮箱@example.com 164 | - GitHub Issues: https://github.com/你的用户名/LearnSpider/issues 165 | 166 | --- 167 | 168 | ### 建议 169 | 170 | 1. **用户体验优化**:虽然前端使用Django模板语法,但可以考虑引入一些现代的前端库和框架,如Bootstrap或Tailwind CSS,以提升用户体验。 171 | 2. **单元测试与持续集成**:增加单元测试,使用CI工具如Travis CI或GitHub Actions,确保代码质量。 172 | 3. **文档与教程**:持续完善文档,增加更多详细的教程和示例代码,帮助用户更好地理解和应用技术。 173 | 4. **社区互动**:建立一个论坛或使用GitHub Discussions,促进用户间的交流与分享。 174 | 5. **安全性与性能优化**:关注爬虫的安全性,避免被反爬机制检测,并优化性能,提升爬取效率。 175 | 176 | 希望这些建议对你的项目有所帮助!如果有更多问题,随时联系我。 177 | 178 | **注意:** 该项目仅供学习和交流使用,不得用于非法活动。作者对任何滥用项目所导致的问题概不负责。 179 | 180 | ### 常用工具命令 181 | 182 | 根据难度分数计算显示顺序 183 | 184 | ```bash 185 | python manage.py update_pass_status 186 | ``` 187 | 188 | 迁移模型 189 | 190 | ```bash 191 | python manage.py makemigrations 192 | python manage.py migrate 193 | ``` 194 | 195 | ```bash 196 | #更新题目的显示顺序id 197 | python manage.py update_difficulty_scores 198 | python manage.py update_order_ids 199 | ``` 200 | 201 | ## 项目赞助 202 | 203 | 赞助支持可以备注github名,会显示在下方列表 204 | 205 | | 日期 | 姓名 | 金额 | 206 | |------------|----------------------------------------------|----| 207 | | 2024.08.20 | [@cpython666](https://github.com/cpython666) | ¥0 | 208 | 209 |

210 | 211 | 微信 212 | 支付宝 213 |

214 | 215 | ## 部署时 216 | 217 | ### 收集静态文件 218 | 219 | ```bash 220 | python manage.py collectstatic --noinput 221 | ``` 222 | 223 | ## 部署时nginx配置 224 | 225 | ``` 226 | server { 227 | listen 80; 228 | server_name learnspider.vip; 229 | 230 | location / { 231 | proxy_pass http://127.0.0.1:8001; # 反向代理到 Django 服务器 232 | proxy_set_header Host $host; 233 | proxy_set_header X-Real-IP $remote_addr; 234 | proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for; 235 | proxy_set_header X-Forwarded-Proto $scheme; 236 | 237 | # 防止 WebSocket 断开(可选,若有 WebSocket 需求) 238 | proxy_http_version 1.1; 239 | proxy_set_header Upgrade $http_upgrade; 240 | proxy_set_header Connection "Upgrade"; 241 | } 242 | 243 | # 处理静态文件(如果 Django 直接提供静态文件,可以忽略) 244 | location /static/ { 245 | alias /usr/local/projects/learnspider_static/; 246 | } 247 | 248 | location /media/ { 249 | alias /path/to/your/media/; 250 | } 251 | } 252 | ``` -------------------------------------------------------------------------------- /api/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/api/__init__.py -------------------------------------------------------------------------------- /api/admin.py: -------------------------------------------------------------------------------- 1 | from django.contrib import admin 2 | 3 | # Register your models here. 
4 | -------------------------------------------------------------------------------- /api/apps.py: -------------------------------------------------------------------------------- 1 | from django.apps import AppConfig 2 | 3 | 4 | class ApiConfig(AppConfig): 5 | default_auto_field = "django.db.models.BigAutoField" 6 | name = "api" 7 | -------------------------------------------------------------------------------- /api/migrations/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/api/migrations/__init__.py -------------------------------------------------------------------------------- /api/models.py: -------------------------------------------------------------------------------- 1 | from django.db import models 2 | 3 | # Create your models here. 4 | -------------------------------------------------------------------------------- /api/tests.py: -------------------------------------------------------------------------------- 1 | from django.test import TestCase 2 | 3 | # Create your tests here. 4 | -------------------------------------------------------------------------------- /api/urls.py: -------------------------------------------------------------------------------- 1 | from django.urls import include 2 | from django.urls import path 3 | from rest_framework.routers import DefaultRouter 4 | 5 | from . 
import views 6 | from .views import TopicsViewSet 7 | from .views import check_answer 8 | 9 | router = DefaultRouter() 10 | router.register(r"api/topics", TopicsViewSet) 11 | 12 | urlpatterns = [ 13 | # 关于题目模型的的api接口 14 | path("", include(router.urls)), 15 | # ---------------页面所需的数据接口------开始----- 16 | path("api/ajax/", views.ajax, name="ajax"), 17 | path("api/pagination1//", views.pagination1, name="pagination1"), 18 | path( 19 | "api/pagination_table//", 20 | views.pagination_table, 21 | name="pagination_table", 22 | ), 23 | path("api/pagination1//", views.pagination1, name="pagination1"), 24 | path("api/post_intro_json/", views.post_intro_json, name="post_intro_json"), 25 | path("api/post_intro_form/", views.post_intro_form, name="post_intro_form"), 26 | # ---------------页面所需的数据接口--------结束-------- 27 | # ------------------工具接口-------------------- 28 | path("api/delay//", views.delay, name="delay"), 29 | # 延迟多少秒返回结果 30 | path("api/delay//", views.delay, name="delay"), 31 | # 返回请求客户端的IP 32 | path("api/ip/", views.get_client_ip, name="get_client_ip"), 33 | # 检查答案是否正确 34 | path("api/check-answer/", check_answer, name="check_answer"), 35 | path("api/server_time/", views.get_server_time, name="get_server_time"), 36 | path("api/ua/", views.get_user_agent, name="get_user_agent"), 37 | path("api/health/", views.health_check, name="health_check"), 38 | path("api/headers/", views.get_request_headers, name="get_request_headers"), 39 | path("api/reverse_string/", views.reverse_string, name="reverse_string"), 40 | path("api/base64_encode/", views.base64_encode, name="base64_encode"), 41 | path("api/base64_decode/", views.base64_decode, name="base64_decode"), 42 | # 返回服务器的时间戳,加密格式 43 | path( 44 | "api/server-timestamp/", views.get_server_timestamp, name="get_server_timestamp" 45 | ), 46 | # ------------------工具接口-------------------- 47 | ] 48 | -------------------------------------------------------------------------------- /collect_data/__init__.py: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/collect_data/__init__.py -------------------------------------------------------------------------------- /collect_data/collect_news.py: -------------------------------------------------------------------------------- 1 | import requests 2 | from pprint import pprint 3 | from topics.models import Topics, News, NewsCategory, NewsPlatform 4 | 5 | 6 | def fetch_platform_news(platform_slug): 7 | # 来源:https://hot.hlds.fun/#/ 8 | url = f"https://dailyhotapi.hlds.fun/{platform_slug}" 9 | print(url) 10 | response = requests.get(url) 11 | if response.status_code == 200: 12 | res = response.json() 13 | data = res["data"] 14 | # pprint(data) 15 | res = [] 16 | for _ in data: 17 | if type(_["timestamp"]) != "int": 18 | _["timestamp"] = None 19 | res.append( 20 | { 21 | "title": _["title"], 22 | "url": _["url"], 23 | "timestamp": _["timestamp"], 24 | "hot": _.get("hot"), 25 | "desc": _.get("desc"), 26 | } 27 | ) 28 | return res 29 | else: 30 | print(response, response.text) 31 | 32 | 33 | def get_all_platforms(): 34 | platforms = NewsPlatform.objects.values_list("slug", flat=True).all() 35 | return list(platforms) 36 | 37 | 38 | if __name__ == "__main__": 39 | get_all_platforms() 40 | -------------------------------------------------------------------------------- /collect_data/collect_news_binance.py: -------------------------------------------------------------------------------- 1 | import requests 2 | from topics.models import Web3NewsTag 3 | from pprint import pprint 4 | from urllib.parse import quote 5 | from datetime import datetime 6 | 7 | 8 | class BianNewsSpider: 9 | def __init__(self): 10 | self.headers = {"clienttype": "web", "lang": "zh-cn"} 11 | self.headers_en = { 12 | "clienttype": "web", 13 | } 14 | self.id_info_mapping = self.merge_tags() 15 | 16 | def fetch_tags(self, en=False): 17 | 
json_data = {} 18 | response = requests.post( 19 | "https://www.binance.com/bapi/composite/v1/friendly/pgc/news/tags", 20 | headers=self.headers_en if en else self.headers, 21 | json=json_data, 22 | ) 23 | if response.status_code != 200: 24 | raise Exception("请求失败:", response.status_code, response.text) 25 | else: 26 | res = response.json() 27 | tags = res["data"]["data"] 28 | return {_["id"]: _ for _ in tags} 29 | 30 | def merge_tags(self): 31 | tags = list(Web3NewsTag.objects.values_list("tag", flat=True).all()) 32 | id_info_mapping = self.fetch_tags() 33 | id_info_mapping_en = self.fetch_tags(en=True) 34 | for tag_id, info in id_info_mapping.items(): 35 | if tag_id in id_info_mapping_en: 36 | info_en = id_info_mapping_en[tag_id] 37 | info_en.pop("id") 38 | info_en.pop("tag") 39 | info |= {f"{k}_en": v for k, v in info_en.items()} 40 | id_info_mapping[tag_id] = info 41 | if info.get("tag") in tags: 42 | continue 43 | else: 44 | Web3NewsTag.objects.create( 45 | tag_id=info.get("id"), 46 | name=info.get("name"), 47 | desc=info.get("description"), 48 | tag=info.get("tag"), 49 | name_en=info.get("name_en"), 50 | desc_en=info.get("description_en"), 51 | url=f"https://www.binance.com/zh-CN/square/news/{quote(info.get('tag').lower())}", 52 | ) 53 | return id_info_mapping 54 | 55 | def fetch_new_by_tag(self, last_time=None): 56 | if not last_time: 57 | page_num = 100 58 | else: 59 | page_num = 0 60 | params = { 61 | "pageIndex": "1", 62 | "pageSize": "20", 63 | "tagId": "15", 64 | } 65 | response = requests.get( 66 | "https://www.binance.com/bapi/composite/v4/friendly/pgc/feed/news/list", 67 | params=params, 68 | headers=self.headers, 69 | ) 70 | if response.status_code != 200: 71 | raise Exception("请求失败", response.status_code, response.text) 72 | res = response.json() 73 | data = res["data"]["vos"] 74 | pprint(data) 75 | 76 | news_lst = [ 77 | { 78 | "title": _["title"], 79 | "subTitle": _["subTitle"], 80 | "webLink": _["webLink"], 81 | "authorName": _["title"], 82 | 
"published_time": datetime.fromtimestamp(_["date"]), 83 | } 84 | for _ in data 85 | ] 86 | pprint(news_lst) 87 | for news in news_lst: 88 | if news["published_time"] <= last_time: 89 | break 90 | 91 | # pprint(response.json()) 92 | 93 | 94 | # if __name__ == '__main__': 95 | # spider = BianNewsSpider() 96 | # print(spider.tags) 97 | -------------------------------------------------------------------------------- /collect_data/collect_news_block_beats.py: -------------------------------------------------------------------------------- 1 | import requests 2 | from pprint import pprint 3 | 4 | params = { 5 | 'is_import': '0', 6 | 'page': '1', 7 | 'type': '0', 8 | } 9 | 10 | response = requests.get('https://appapi.blockbeats.cn/v6/flash/list', params=params) 11 | res = response.json() 12 | if res["status"] == 0: 13 | data = res["data"] 14 | total = data["total"] 15 | total_page = data["totalPage"] 16 | data_lst = data["data"] 17 | for data_item in data_lst: 18 | id = data_item["id"] 19 | url = data_item["h5"] 20 | title = data_item["title"] 21 | content = data_item["content"] 22 | time_str = data_item["time"] 23 | add_time = data_item["add_time"] 24 | rich_text = data_item["rich_text"] 25 | 26 | pprint(res) 27 | print(res.keys()) 28 | -------------------------------------------------------------------------------- /docker-compose.yml: -------------------------------------------------------------------------------- 1 | version: '3.8' 2 | 3 | services: 4 | web: 5 | image: python:3.11-slim 6 | container_name: learn_spider_app 7 | restart: unless-stopped 8 | working_dir: /app 9 | volumes: 10 | - .:/app # 映射当前目录 11 | ports: 12 | - "8001:8001" 13 | environment: 14 | - PYTHONUNBUFFERED=1 15 | command: > 16 | bash -c " 17 | pip install --no-cache-dir -r /app/requirements.txt -i https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple && 18 | python /app/manage.py collectstatic --noinput && # 收集静态文件 19 | python /app/manage.py runserver 0.0.0.0:8001 # 使用 6666 端口 20 | " 21 | 
-------------------------------------------------------------------------------- /docs/开发者文档.md: -------------------------------------------------------------------------------- 1 | ## 写在前面 2 | 3 | 或许是受够了没有文档的项目,所以自己的项目一定要有文档。 4 | 可以说我的文档写的不好,但我会尽我所能写好文档。 5 | 6 | ## 文档 7 | 8 | ## 题目地址 9 | 10 | 由两部分组成,分别是response_path和api_prefix 11 | response_path就是题目链接的后缀 12 | 而api_prefix是题目链接的前缀,也就是题目接口的类型 13 | 目前题目类型分为三种: 14 | 15 | - url/:题目链接不是本项目提供,跳转到一个公网url,比如序言中会有很多文档写在github,那么会重定向过去 16 | - page/:【静态页面】题目只有一个静态html,这样则可以直接通过一个视图返回一个静态的html页面,也包括注入python代码片段的页面。页面存放在topics/pages文件夹中。 17 | - view/:【需要django渲染数据进模板】题目需要通过单独的django视图控制,像校验ua,或者请求头中一些参数的时候,之后再返回页面。页面存放在topics/views文件夹中。 18 | - 可能还会有一种题目,需要大量的页面,目前还没设计,取个什么前缀名好呢🤔。 19 | 20 | ## 一些工具接口 21 | 22 | > 以 /api 开头 23 | 24 | - 返回请求客户端的ip http://localhost:8001/api/ip/ 25 | - 返回ua http://localhost:8001/api/ua/ 26 | - 返回请求头 http://localhost:8001/api/headers/ 27 | - 返回服务器时间 http://localhost:8001/api/server_time/ 28 | - 加密返回服务器时间 http://localhost:8001/api/server-timestamp/ 29 | - 返回服务器的健康状态 http://localhost:8001/api/health/ 30 | - 延迟多少秒返回结果 http://localhost:8001/api/delay/3/ 31 | - base64加密 http://localhost:8001/api/base64_encode/ 32 | - base64解密 http://localhost:8001/api/base64_decode/ 33 | - 反转字符串 http://localhost:8001/api/reverse_string/ 34 | 35 | # 关于题目模型的api接口 36 | 37 | ## 细碎重要点‼️ 38 | 39 | - 40 | 页面的标题【title标签里面的内容】需要与数据库中的title字段保持一致【html中空格换行会被去除】,因为回答问题发送的请求会携带答案和页面的title字段去数据库中找到对应的问题,然后找到答案,对比答案...很蠢,但没办法。没想到更好的解决办法。传id意味着还需要把id传进去。视图函数类型又多。id的序号也乱,因为会中间加题。 -------------------------------------------------------------------------------- /logs/django_error.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/logs/django_error.log -------------------------------------------------------------------------------- /manage.py: 
-------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | """Django's command-line utility for administrative tasks.""" 3 | import os 4 | import sys 5 | 6 | BANNER = r""" 7 | _ _ __ __ __ 8 | | | | | / / / / / / 9 | ___ _ __ _ _ | |_ | |__ ___ _ __ / /_ / /_ / /_ 10 | / __| | '_ \ | | | | | __| | '_ \ / _ \ | '_ \ | '_ \ | '_ \ | '_ \ 11 | | (__ | |_) | | |_| | | |_ | | | | | (_) | | | | | | (_) | | (_) | | (_) | 12 | \___| | .__/ \__, | \__| |_| |_| \___/ |_| |_| \___/ \___/ \___/ 13 | | | __/ | 14 | |_| |___/ 15 | 访问我的博客:https://cpython666.github.io/ 16 | 访问我的博客:https://stardreamfly.github.io/ 17 | """ 18 | 19 | 20 | def main(): 21 | """Run administrative tasks.""" 22 | os.environ.setdefault("DJANGO_SETTINGS_MODULE", "LearnSpider.settings") 23 | try: 24 | from django.core.management import execute_from_command_line 25 | except ImportError as exc: 26 | raise ImportError( 27 | "Couldn't import Django. Are you sure it's installed and " 28 | "available on your PYTHONPATH environment variable? Did you " 29 | "forget to activate a virtual environment?" 
30 | ) from exc 31 | if "runserver" in sys.argv: 32 | if not os.environ.get("RUN_MAIN", None): 33 | print(BANNER) # Print the banner only if RUN_MAIN is not set 34 | else: 35 | print(BANNER) 36 | execute_from_command_line(sys.argv) 37 | 38 | 39 | if __name__ == "__main__": 40 | main() 41 | -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | Django==5.0.7 2 | DrissionPage==4.1.0.17 3 | PyMySQL==1.1.1 4 | python-dotenv==1.0.1 5 | Requests==2.32.3 6 | djangorestframework 7 | apscheduler==3.11.0 8 | redis 9 | invoke -------------------------------------------------------------------------------- /spider_demo/demo/demo/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/spider_demo/demo/demo/__init__.py -------------------------------------------------------------------------------- /spider_demo/demo/demo/items.py: -------------------------------------------------------------------------------- 1 | # Define here the models for your scraped items 2 | # 3 | # See documentation in: 4 | # https://docs.scrapy.org/en/latest/topics/items.html 5 | 6 | import scrapy 7 | 8 | 9 | class NewsItem(scrapy.Item): 10 | title = scrapy.Field() # 新闻标题 11 | url = scrapy.Field() # 新闻链接 12 | -------------------------------------------------------------------------------- /spider_demo/demo/demo/middlewares.py: -------------------------------------------------------------------------------- 1 | # Define here the models for your spider middleware 2 | # 3 | # See documentation in: 4 | # https://docs.scrapy.org/en/latest/topics/spider-middleware.html 5 | 6 | from scrapy import signals 7 | 8 | # useful for handling different item types with a single interface 9 | from itemadapter import is_item, ItemAdapter 10 | 11 | 12 | class 
DemoSpiderMiddleware: 13 | # Not all methods need to be defined. If a method is not defined, 14 | # scrapy acts as if the spider middleware does not modify the 15 | # passed objects. 16 | 17 | @classmethod 18 | def from_crawler(cls, crawler): 19 | # This method is used by Scrapy to create your spiders. 20 | s = cls() 21 | crawler.signals.connect(s.spider_opened, signal=signals.spider_opened) 22 | return s 23 | 24 | def process_spider_input(self, response, spider): 25 | # Called for each response that goes through the spider 26 | # middleware and into the spider. 27 | 28 | # Should return None or raise an exception. 29 | return None 30 | 31 | def process_spider_output(self, response, result, spider): 32 | # Called with the results returned from the Spider, after 33 | # it has processed the response. 34 | 35 | # Must return an iterable of Request, or item objects. 36 | for i in result: 37 | yield i 38 | 39 | def process_spider_exception(self, response, exception, spider): 40 | # Called when a spider or process_spider_input() method 41 | # (from other spider middleware) raises an exception. 42 | 43 | # Should return either None or an iterable of Request or item objects. 44 | pass 45 | 46 | def process_start_requests(self, start_requests, spider): 47 | # Called with the start requests of the spider, and works 48 | # similarly to the process_spider_output() method, except 49 | # that it doesn’t have a response associated. 50 | 51 | # Must return only requests (not items). 52 | for r in start_requests: 53 | yield r 54 | 55 | def spider_opened(self, spider): 56 | spider.logger.info("Spider opened: %s" % spider.name) 57 | 58 | 59 | class DemoDownloaderMiddleware: 60 | # Not all methods need to be defined. If a method is not defined, 61 | # scrapy acts as if the downloader middleware does not modify the 62 | # passed objects. 63 | 64 | @classmethod 65 | def from_crawler(cls, crawler): 66 | # This method is used by Scrapy to create your spiders. 
67 | s = cls() 68 | crawler.signals.connect(s.spider_opened, signal=signals.spider_opened) 69 | return s 70 | 71 | def process_request(self, request, spider): 72 | # Called for each request that goes through the downloader 73 | # middleware. 74 | 75 | # Must either: 76 | # - return None: continue processing this request 77 | # - or return a Response object 78 | # - or return a Request object 79 | # - or raise IgnoreRequest: process_exception() methods of 80 | # installed downloader middleware will be called 81 | print("请求之前") 82 | return None 83 | 84 | def process_response(self, request, response, spider): 85 | # Called with the response returned from the downloader. 86 | 87 | # Must either; 88 | # - return a Response object 89 | # - return a Request object 90 | # - or raise IgnoreRequest 91 | print("响应之后") 92 | return response 93 | 94 | def process_exception(self, request, exception, spider): 95 | # Called when a download handler or a process_request() 96 | # (from other downloader middleware) raises an exception. 
97 | 98 | # Must either: 99 | # - return None: continue processing this exception 100 | # - return a Response object: stops process_exception() chain 101 | # - return a Request object: stops process_exception() chain 102 | pass 103 | 104 | def spider_opened(self, spider): 105 | spider.logger.info("Spider opened: %s" % spider.name) 106 | -------------------------------------------------------------------------------- /spider_demo/demo/demo/pipelines.py: -------------------------------------------------------------------------------- 1 | # Define your item pipelines here 2 | # 3 | # Don't forget to add your pipeline to the ITEM_PIPELINES setting 4 | # See: https://docs.scrapy.org/en/latest/topics/item-pipeline.html 5 | 6 | 7 | # useful for handling different item types with a single interface 8 | from itemadapter import ItemAdapter 9 | 10 | 11 | class NewsPipeline: 12 | def process_item(self, item, spider): 13 | # 数据清洗或验证的逻辑 14 | item["title"] = item["title"].strip() # 去除标题前后的空格 15 | print(f"pipeline item: {item}") 16 | return item 17 | -------------------------------------------------------------------------------- /spider_demo/demo/demo/settings.py: -------------------------------------------------------------------------------- 1 | # Scrapy settings for demo project 2 | # 3 | # For simplicity, this file contains only settings considered important or 4 | # commonly used. 
You can find more settings consulting the documentation: 5 | # 6 | # https://docs.scrapy.org/en/latest/topics/settings.html 7 | # https://docs.scrapy.org/en/latest/topics/downloader-middleware.html 8 | # https://docs.scrapy.org/en/latest/topics/spider-middleware.html 9 | 10 | BOT_NAME = "demo" 11 | 12 | SPIDER_MODULES = ["demo.spiders"] 13 | NEWSPIDER_MODULE = "demo.spiders" 14 | 15 | # Crawl responsibly by identifying yourself (and your website) on the user-agent 16 | # USER_AGENT = "demo (+http://www.yourdomain.com)" 17 | 18 | # Obey robots.txt rules 19 | ROBOTSTXT_OBEY = False 20 | # ROBOTSTXT_OBEY = True 21 | 22 | # Configure maximum concurrent requests performed by Scrapy (default: 16) 23 | # CONCURRENT_REQUESTS = 32 24 | 25 | # Configure a delay for requests for the same website (default: 0) 26 | # See https://docs.scrapy.org/en/latest/topics/settings.html#download-delay 27 | # See also autothrottle settings and docs 28 | # DOWNLOAD_DELAY = 3 29 | # The download delay setting will honor only one of: 30 | # CONCURRENT_REQUESTS_PER_DOMAIN = 16 31 | # CONCURRENT_REQUESTS_PER_IP = 16 32 | 33 | # Disable cookies (enabled by default) 34 | # COOKIES_ENABLED = False 35 | 36 | # Disable Telnet Console (enabled by default) 37 | # TELNETCONSOLE_ENABLED = False 38 | 39 | # Override the default request headers: 40 | # DEFAULT_REQUEST_HEADERS = { 41 | # "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8", 42 | # "Accept-Language": "en", 43 | # } 44 | 45 | # Enable or disable spider middlewares 46 | # See https://docs.scrapy.org/en/latest/topics/spider-middleware.html 47 | # SPIDER_MIDDLEWARES = { 48 | # "demo.middlewares.DemoSpiderMiddleware": 543, 49 | # } 50 | 51 | # Enable or disable downloader middlewares 52 | # See https://docs.scrapy.org/en/latest/topics/downloader-middleware.html 53 | # DOWNLOADER_MIDDLEWARES = { 54 | # "demo.middlewares.DemoDownloaderMiddleware": 543, 55 | # } 56 | 57 | # Enable or disable extensions 58 | # See 
https://docs.scrapy.org/en/latest/topics/extensions.html 59 | # EXTENSIONS = { 60 | # "scrapy.extensions.telnet.TelnetConsole": None, 61 | # } 62 | 63 | # Configure item pipelines 64 | # See https://docs.scrapy.org/en/latest/topics/item-pipeline.html 65 | # ITEM_PIPELINES = { 66 | # "demo.pipelines.DemoPipeline": 300, 67 | # } 68 | 69 | 70 | # Enable and configure the AutoThrottle extension (disabled by default) 71 | # See https://docs.scrapy.org/en/latest/topics/autothrottle.html 72 | # AUTOTHROTTLE_ENABLED = True 73 | # The initial download delay 74 | # AUTOTHROTTLE_START_DELAY = 5 75 | # The maximum download delay to be set in case of high latencies 76 | # AUTOTHROTTLE_MAX_DELAY = 60 77 | # The average number of requests Scrapy should be sending in parallel to 78 | # each remote server 79 | # AUTOTHROTTLE_TARGET_CONCURRENCY = 1.0 80 | # Enable showing throttling stats for every response received: 81 | # AUTOTHROTTLE_DEBUG = False 82 | 83 | # Enable and configure HTTP caching (disabled by default) 84 | # See https://docs.scrapy.org/en/latest/topics/downloader-middleware.html#httpcache-middleware-settings 85 | # HTTPCACHE_ENABLED = True 86 | # HTTPCACHE_EXPIRATION_SECS = 0 87 | # HTTPCACHE_DIR = "httpcache" 88 | # HTTPCACHE_IGNORE_HTTP_CODES = [] 89 | # HTTPCACHE_STORAGE = "scrapy.extensions.httpcache.FilesystemCacheStorage" 90 | 91 | # Set settings whose default value is deprecated to a future-proof value 92 | TWISTED_REACTOR = "twisted.internet.asyncioreactor.AsyncioSelectorReactor" 93 | FEED_EXPORT_ENCODING = "utf-8" 94 | -------------------------------------------------------------------------------- /spider_demo/demo/demo/spiders/__init__.py: -------------------------------------------------------------------------------- 1 | # This package will contain the spiders of your Scrapy project 2 | # 3 | # Please refer to the documentation for information on how to create and manage 4 | # your spiders. 
5 | -------------------------------------------------------------------------------- /spider_demo/demo/demo/spiders/hello_scrapy.py: -------------------------------------------------------------------------------- 1 | from typing import Iterable 2 | 3 | import scrapy 4 | from scrapy import Request 5 | 6 | 7 | class HelloScrapySpider(scrapy.Spider): 8 | name = "hello_scrapy" 9 | # allowed_domains = ["baidu.com"] 10 | start_urls = ["https://cn.bing.com/"] 11 | 12 | def start_requests(self) -> Iterable[Request]: 13 | yield Request("http://localhost:8001/", callback=self.parse) 14 | 15 | def parse(self, response): 16 | print(1, response) 17 | print(response.css(".h1::text").get()) 18 | urls = [ 19 | "http://localhost:8001/?sort=asc¶m=1", 20 | "http://localhost:8001/?param=1&sort=asc", 21 | ] 22 | for url in urls: 23 | yield scrapy.Request( 24 | url, callback=self.parse_local, meta={"aaa": 111}, dont_filter=True 25 | ) 26 | 27 | def parse_local(self, response): 28 | print("请求了一次") 29 | # print(response.meta.get('aaa')) 30 | # print(response) 31 | -------------------------------------------------------------------------------- /spider_demo/demo/demo/spiders/parse_demo.py: -------------------------------------------------------------------------------- 1 | import scrapy 2 | from demo.items import NewsItem 3 | 4 | 5 | class ParseDemoSpider(scrapy.Spider): 6 | custom_settings = { 7 | # "ITEM_PIPELINES": { 8 | # 'demo.pipelines.NewsPipeline': 1, # 启用 NewsPipeline 9 | # }, 10 | # "DOWNLOADER_MIDDLEWARES": { 11 | # 'demo.middlewares.DemoDownloaderMiddleware': 543 12 | # } 13 | } 14 | 15 | name = "parse_demo" 16 | start_urls = ["http://localhost:8001/sandbox/news/hot/"] 17 | 18 | def parse(self, response): 19 | card_lst = response.css(".card-body") 20 | for card in card_lst: 21 | # item = NewsItem() 22 | # item['title'] = card.css('a span::text').get() 23 | # item['url'] = card.css('a::attr(href)').get() 24 | yield { 25 | "title": card.css("a span::text").get(), 26 | "url": 
card.css("a::attr(href)").get(), 27 | } 28 | # print(card.css('a span::text').get(), card.css('a::attr(href)').get()) 29 | # yield item 30 | 31 | 32 | if __name__ == "__main__": 33 | from scrapy import Selector 34 | 35 | text = "111" 36 | response = Selector(text=text) 37 | print(response.xpath("//a/text()").get()) 38 | -------------------------------------------------------------------------------- /spider_demo/demo/demo/spiders/post_spider.py: -------------------------------------------------------------------------------- 1 | import scrapy 2 | import json 3 | 4 | 5 | class JsonRequestSpider(scrapy.Spider): 6 | name = "json_spider" 7 | 8 | start_urls = ["http://localhost:8001/api/post_intro_json/"] 9 | 10 | def start_requests(self): 11 | # JSON 数据 12 | data = { 13 | "password": "post", 14 | } 15 | 16 | # 请求头,指定发送 JSON 数据 17 | headers = { 18 | "Content-Type": "application/json", 19 | } 20 | 21 | # 发送 POST 请求 22 | yield scrapy.Request( 23 | url=self.start_urls[0], 24 | method="POST", 25 | headers=headers, 26 | body=json.dumps(data), # 将字典转换为 JSON 字符串 27 | callback=self.parse, 28 | ) 29 | 30 | def parse(self, response): 31 | # 解析响应数据 32 | data = json.loads(response.text) 33 | self.log(f"响应数据: {data}") 34 | 35 | 36 | class FormRequestSpider(scrapy.Spider): 37 | name = "form_spider" 38 | 39 | start_urls = ["http://localhost:8001/api/post_intro_form/"] 40 | 41 | def start_requests(self): 42 | # JSON 数据 43 | formdata = { 44 | "password": "post", 45 | } 46 | 47 | # 发送 POST 请求 48 | yield scrapy.FormRequest( 49 | url=self.start_urls[0], 50 | method="POST", 51 | formdata=formdata, # 将字典转换为 JSON 字符串 52 | callback=self.parse, 53 | ) 54 | 55 | def parse(self, response): 56 | # 解析响应数据 57 | data = json.loads(response.text) 58 | self.log(f"响应数据: {data}") 59 | -------------------------------------------------------------------------------- /spider_demo/demo/output.json: -------------------------------------------------------------------------------- 1 | [ 2 | {"title": "研究二次元的专家", 
"url": "https://b23.tv/BV1L6PKeyEpF"}, 3 | {"title": "春天的第一次公路旅行", "url": "https://www.douyin.com/hot/2009696"}, 4 | {"title": "博士配偶为初中学历被安排工作,湖北师范大学回应「符合政策,属劳务派遣」,怎样看待此事?", "url": "https://www.zhihu.com/question/13286722569"}, 5 | {"title": "老人离世4名后人治丧后意外身亡", "url": "https://www.baidu.com/s?wd=%E8%80%81%E4%BA%BA%E7%A6%BB%E4%B8%964%E5%90%8D%E5%90%8E%E4%BA%BA%E6%B2%BB%E4%B8%A7%E5%90%8E%E6%84%8F%E5%A4%96%E8%BA%AB%E4%BA%A1"}, 6 | {"title": "刚刚,全球首个混合推理模型Claude 3.7降世!最强编程大脑暴击DeepSeek R1", "url": "https://www.36kr.com/p/3181320656196736"}, 7 | {"title": "华为余承东预告“想不到的产品”:首款为原生鸿蒙而生的新形态手机 3 月见", "url": "https://www.ithome.com/0/833/121.htm"}, 8 | {"title": "本周看什么 | 最近值得一看的 9 部作品", "url": "https://sspai.com/post/96593"}, 9 | {"title": "中美俄均投下赞成票,联合国安理会通过涉乌决议", "url": "https://www.thepaper.cn/newsDetail_forward_30236174"}, 10 | {"title": "中美俄立场罕见一致释放什么信号", "url": "https://www.toutiao.com/trending/7475304273840983578/"}, 11 | {"title": "王祖贤在贴吧官宣创业", "url": "https://tieba.baidu.com/hottopic/browse/hottopic?topic_id=28339488&topic_name=%E7%8E%8B%E7%A5%96%E8%B4%A4%E5%9C%A8%E8%B4%B4%E5%90%A7%E5%AE%98%E5%AE%A3%E5%88%9B%E4%B8%9A"}, 12 | {"title": "MobVue 开源啦!", "url": "https://juejin.cn/post/7474782353463787556"}, 13 | {"title": "【6.9】误判", "url": "https://movie.douban.com/subject/36401937/"}, 14 | {"title": "总书记关心的事丨“绿电”点亮班彦村", "url": "https://new.qq.com/rain/a/20250225A01EPV00"}, 15 | {"title": "男子夜晚去找小三偷情 上门发现小三正和情人发生关系", "url": "https://www.163.com/dy/article/JP8MH31K0523WUD9.html"}, 16 | {"title": "AI未来进行式(DeepSeek、宇树科技、人形机器人、AI面试官……本书全部预言)", "url": "https://weread.qq.com/web/bookDetail/0bc32b20813ab6d9fg0114c1"}, 17 | {"title": "2025年2月25日 不停机更新 ", "url": "https://lol.qq.com/news/detail.shtml?docid=13900088934026462960"}, 18 | {"title": "3.1版本活动跃迁 | 第一期", "url": "https://www.miyoushe.com/sr/article/62249173"}, 19 | {"title": "「征战勇者淬炼之界」活动:突破试炼得名片", "url": "https://www.miyoushe.com/ys/article/62181653"}, 20 | {"title": "关于我就是李大嘴的几点原因", "url": 
"https://www.douban.com/group/topic/319699118/?_spm_id=MTIzMDA2NjUx"}, 21 | {"title": "AI 训练跟踪与可视化平台", "url": "https://hellogithub.com/repository/b442a9fa270e4ccb8847c9ee3445e41b"}, 22 | {"title": "开普勒当时是如何计算出行星轨道是椭圆的呢?", "url": "https://daily.zhihu.com/story/9779237"}, 23 | {"title": "18禁恋爱老婆来到三次元!一见面竟被作者做这样的事情?", "url": "https://www.jianshu.com/p/ca32a84e3861"} 24 | ] -------------------------------------------------------------------------------- /spider_demo/demo/scrapy.cfg: -------------------------------------------------------------------------------- 1 | # Automatically created by: scrapy startproject 2 | # 3 | # For more information about the [deploy] section see: 4 | # https://scrapyd.readthedocs.io/en/latest/deploy.html 5 | 6 | [settings] 7 | default = demo.settings 8 | 9 | [deploy] 10 | #url = http://localhost:6800/ 11 | project = demo 12 | -------------------------------------------------------------------------------- /static/bootstrap/bootstrap-icons.woff: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/bootstrap/bootstrap-icons.woff -------------------------------------------------------------------------------- /static/bootstrap/bootstrap-icons.woff2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/bootstrap/bootstrap-icons.woff2 -------------------------------------------------------------------------------- /static/imgs/favicon.ico: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/favicon.ico -------------------------------------------------------------------------------- /static/imgs/friends/learnspider_logo.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/friends/learnspider_logo.png -------------------------------------------------------------------------------- /static/imgs/friends/stardream_logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/friends/stardream_logo.png -------------------------------------------------------------------------------- /static/imgs/logo.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/logo.jpeg -------------------------------------------------------------------------------- /static/imgs/sandbox/blog.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/sandbox/blog.jpeg -------------------------------------------------------------------------------- /static/imgs/sandbox/music.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/sandbox/music.jpeg -------------------------------------------------------------------------------- /static/imgs/sandbox/news.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/sandbox/news.jpeg -------------------------------------------------------------------------------- /static/imgs/sandbox/shop.jpeg: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/sandbox/shop.jpeg -------------------------------------------------------------------------------- /static/imgs/sandbox/video.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/sandbox/video.jpeg -------------------------------------------------------------------------------- /static/imgs/sandbox/wallpaper.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/sandbox/wallpaper.jpeg -------------------------------------------------------------------------------- /static/imgs/setu/1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/setu/1.jpg -------------------------------------------------------------------------------- /static/imgs/setu/1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/setu/1.png -------------------------------------------------------------------------------- /static/imgs/setu/2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/setu/2.jpg -------------------------------------------------------------------------------- /static/imgs/setu/2.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/setu/2.png -------------------------------------------------------------------------------- /static/imgs/setu/3.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/setu/3.jpg -------------------------------------------------------------------------------- /static/imgs/setu/3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/setu/3.png -------------------------------------------------------------------------------- /static/imgs/sponsors/evolution_host.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/sponsors/evolution_host.png -------------------------------------------------------------------------------- /static/imgs/sponsors/lky_logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/sponsors/lky_logo.png -------------------------------------------------------------------------------- /static/imgs/sponsors/qgwl_logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/sponsors/qgwl_logo.png -------------------------------------------------------------------------------- /static/imgs/sponsors/yrx_logo.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/sponsors/yrx_logo.png -------------------------------------------------------------------------------- /static/imgs/support/lky.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/support/lky.png -------------------------------------------------------------------------------- /static/imgs/support/wx.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/support/wx.jpg -------------------------------------------------------------------------------- /static/imgs/support/yrx.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/support/yrx.png -------------------------------------------------------------------------------- /static/imgs/support/zfb.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/static/imgs/support/zfb.jpg -------------------------------------------------------------------------------- /static/js/cpython666.js: -------------------------------------------------------------------------------- 1 | console.log( 2 | ` 3 | _ _ __ __ __ 4 | | | | | / / / / / / 5 | ___ _ __ _ _ | |_ | |__ ___ _ __ / /_ / /_ / /_ 6 | / __| | '_ \\ | | | | | __| | '_ \\ / _ \\ | '_ \\ | '_ \\ | '_ \\ | '_ \\ 7 | | (__ | |_) | | |_| | | |_ | | | | | (_) | | | | | | (_) | | (_) | | (_) | 8 | \\___| | .__/ \\__, | \\__| |_| |_| \\___/ |_| |_| \\___/ \\___/ \\___/ 9 | | | __/ | 10 | |_| |___/ 11 | `); 12 | 
console.log('访问我的博客:https://cpython666.github.io/'); 13 | console.log('访问我的博客:https://stardreamfly.github.io/'); -------------------------------------------------------------------------------- /tasks.py: -------------------------------------------------------------------------------- 1 | from invoke import task 2 | 3 | 4 | @task 5 | def up(c): 6 | c.run("docker compose up -d --build") 7 | 8 | 9 | @task 10 | def b(c): 11 | c.run("black .") 12 | 13 | 14 | @task 15 | def makemigrations(c): 16 | c.run("python manage.py makemigrations") 17 | 18 | 19 | @task(pre=[makemigrations]) 20 | def m(c): 21 | c.run("python manage.py migrate") 22 | 23 | print("运行迁移命令") 24 | -------------------------------------------------------------------------------- /test/demo.py: -------------------------------------------------------------------------------- 1 | import requests 2 | 3 | # res=requests.get('https://www.whu.edu.cn/') 4 | res = requests.get("http://localhost:8001/view/encode/") 5 | # res=requests.get('http://localhost:8001/demo1/') 6 | print(res.text) 7 | print(res.encoding) 8 | -------------------------------------------------------------------------------- /test/dp.py: -------------------------------------------------------------------------------- 1 | from DrissionPage import ChromiumPage 2 | 3 | page = ChromiumPage() 4 | page.get("http://localhost:8001/view/request-twice/") 5 | print(page.html) 6 | page.quit() 7 | -------------------------------------------------------------------------------- /topics/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/topics/__init__.py -------------------------------------------------------------------------------- /topics/admin.py: -------------------------------------------------------------------------------- 1 | from django.contrib import admin 2 | from .models import Topics 3 | 4 | 5 | class 
TopicsAdmin(admin.ModelAdmin): 6 | list_display = ("title", "order_id", "category", "difficulty", "pass_status") 7 | list_editable = ("order_id",) # 允许在列表中编辑 order_id 8 | 9 | 10 | admin.site.register(Topics, TopicsAdmin) 11 | -------------------------------------------------------------------------------- /topics/apps.py: -------------------------------------------------------------------------------- 1 | from django.apps import AppConfig 2 | 3 | 4 | class TopicsConfig(AppConfig): 5 | default_auto_field = "django.db.models.BigAutoField" 6 | name = "topics" 7 | 8 | def ready(self): 9 | from topics.scheduler import start_scheduler 10 | from LearnSpider.settings import DJANGO_ENV 11 | 12 | # if DJANGO_ENV != "local": 13 | # start_scheduler() 14 | start_scheduler() 15 | -------------------------------------------------------------------------------- /topics/decorators.py: -------------------------------------------------------------------------------- 1 | from django.http import JsonResponse 2 | 3 | 4 | def require_ua(view_func): 5 | def _wrapped_view(request, *args, **kwargs): 6 | user_agent = request.META.get("HTTP_USER_AGENT") 7 | if not user_agent: 8 | return JsonResponse({"error": "User-Agent header is required"}, status=400) 9 | return view_func(request, *args, **kwargs) 10 | 11 | return _wrapped_view 12 | -------------------------------------------------------------------------------- /topics/management/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/topics/management/__init__.py -------------------------------------------------------------------------------- /topics/management/commands/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/topics/management/commands/__init__.py 
-------------------------------------------------------------------------------- /topics/management/commands/fetch_news_data.py: -------------------------------------------------------------------------------- 1 | from django.core.management.base import BaseCommand 2 | from topics.tasks import fetch_and_save_news 3 | 4 | 5 | # python manage.py fetch_news_data 6 | class Command(BaseCommand): 7 | help = "采集一批热点新闻" 8 | 9 | def handle(self, *args, **kwargs): 10 | fetch_and_save_news() 11 | -------------------------------------------------------------------------------- /topics/management/commands/fetch_news_web3.py: -------------------------------------------------------------------------------- 1 | from django.core.management.base import BaseCommand 2 | from collect_data.collect_news_binance import BianNewsSpider 3 | 4 | 5 | # python manage.py fetch_news_web3 6 | class Command(BaseCommand): 7 | help = "批量更新题目的 category,规范化 category" 8 | 9 | def handle(self, *args, **kwargs): 10 | spider = BianNewsSpider() 11 | print(spider.id_info_mapping) 12 | # spider.fetch_new_by_tag() 13 | -------------------------------------------------------------------------------- /topics/management/commands/update_category.py: -------------------------------------------------------------------------------- 1 | from django.core.management.base import BaseCommand 2 | from topics.models import Topics 3 | 4 | 5 | # python manage.py update_category 6 | class Command(BaseCommand): 7 | help = "批量更新题目的 category,规范化 category" 8 | 9 | def handle(self, *args, **kwargs): 10 | questions = Topics.objects.all() 11 | for question in questions: 12 | if question.category: 13 | question.category = ",".join( 14 | question.category.replace(",", ",") 15 | .replace(";", ",") 16 | .replace(";", ",") 17 | .split(",") 18 | ) 19 | question.save() 20 | self.stdout.write(self.style.SUCCESS("已成功规范化 category 字段")) 21 | -------------------------------------------------------------------------------- 
/topics/management/commands/update_difficulty_scores.py: -------------------------------------------------------------------------------- 1 | from django.core.management.base import BaseCommand 2 | from topics.models import Topics 3 | 4 | 5 | # python manage.py update_difficulty_scores 6 | class Command(BaseCommand): 7 | help = "批量更新题目的 difficulty_score 字段,规则为目前的 difficulty_score 排序号乘以 10" 8 | 9 | def handle(self, *args, **kwargs): 10 | questions = Topics.objects.all().order_by("difficulty_score") 11 | for idx, question in enumerate(questions): 12 | question.difficulty_score = (idx + 1) * 10 13 | question.save() 14 | self.stdout.write(self.style.SUCCESS("Successfully updated difficulty_scores")) 15 | -------------------------------------------------------------------------------- /topics/management/commands/update_order_ids.py: -------------------------------------------------------------------------------- 1 | from django.core.management.base import BaseCommand 2 | from topics.models import Topics 3 | 4 | 5 | # python manage.py update_order_ids 6 | class Command(BaseCommand): 7 | help = "批量更新题目的 order_id,根绝题目的 order_id 排序好乘以 10" 8 | 9 | def handle(self, *args, **kwargs): 10 | questions = Topics.objects.all().order_by("order_id") 11 | for idx, question in enumerate(questions): 12 | question.order_id = (idx + 1) * 10 13 | question.save() 14 | self.stdout.write(self.style.SUCCESS("已成功更新 order_ids")) 15 | -------------------------------------------------------------------------------- /topics/management/commands/update_pass_status.py: -------------------------------------------------------------------------------- 1 | # api/management/commands/update_pass_status.py 2 | 3 | from django.core.management.base import BaseCommand 4 | from topics.models import Topics 5 | 6 | 7 | class Command(BaseCommand): 8 | help = "批量更新题目的 pass_status 字段为 false" 9 | 10 | def handle(self, *args, **kwargs): 11 | updated_count = Topics.objects.update(pass_status=False) 12 | 
self.stdout.write( 13 | self.style.SUCCESS( 14 | f"Successfully updated pass_status for {updated_count} topics" 15 | ) 16 | ) 17 | -------------------------------------------------------------------------------- /topics/migrations/0001_initial.py: -------------------------------------------------------------------------------- 1 | # Generated by Django 5.0.7 on 2025-02-16 17:02 2 | 3 | import django.db.models.deletion 4 | from django.db import migrations, models 5 | 6 | 7 | class Migration(migrations.Migration): 8 | 9 | initial = True 10 | 11 | dependencies = [] 12 | 13 | operations = [ 14 | migrations.CreateModel( 15 | name="Category", 16 | fields=[ 17 | ("created_at", models.DateTimeField(auto_now_add=True, null=True)), 18 | ("updated_at", models.DateTimeField(auto_now=True, null=True)), 19 | ("id", models.AutoField(primary_key=True, serialize=False)), 20 | ( 21 | "name", 22 | models.CharField( 23 | blank=True, help_text="类别名", max_length=200, null=True 24 | ), 25 | ), 26 | ( 27 | "detail", 28 | models.CharField( 29 | blank=True, 30 | default=None, 31 | help_text="类别的描述", 32 | max_length=200, 33 | null=True, 34 | ), 35 | ), 36 | ], 37 | options={ 38 | "db_table": "sd_ls_category", 39 | }, 40 | ), 41 | migrations.CreateModel( 42 | name="NewsCategory", 43 | fields=[ 44 | ( 45 | "id", 46 | models.BigAutoField( 47 | auto_created=True, 48 | primary_key=True, 49 | serialize=False, 50 | verbose_name="ID", 51 | ), 52 | ), 53 | ("created_at", models.DateTimeField(auto_now_add=True, null=True)), 54 | ("updated_at", models.DateTimeField(auto_now=True, null=True)), 55 | ("name", models.CharField(max_length=100)), 56 | ("slug", models.CharField(max_length=255, unique=True)), 57 | ("description", models.TextField(blank=True, null=True)), 58 | ], 59 | options={ 60 | "db_table": "sd_ls_news_category", 61 | }, 62 | ), 63 | migrations.CreateModel( 64 | name="NewsPlatform", 65 | fields=[ 66 | ( 67 | "id", 68 | models.BigAutoField( 69 | auto_created=True, 70 | primary_key=True, 71 | 
serialize=False, 72 | verbose_name="ID", 73 | ), 74 | ), 75 | ("created_at", models.DateTimeField(auto_now_add=True, null=True)), 76 | ("updated_at", models.DateTimeField(auto_now=True, null=True)), 77 | ("name", models.CharField(max_length=100)), 78 | ("slug", models.SlugField(unique=True)), 79 | ( 80 | "description", 81 | models.CharField(blank=True, max_length=255, null=True), 82 | ), 83 | ], 84 | options={ 85 | "db_table": "sd_ls_news_platform", 86 | }, 87 | ), 88 | migrations.CreateModel( 89 | name="Topics", 90 | fields=[ 91 | ("created_at", models.DateTimeField(auto_now_add=True, null=True)), 92 | ("updated_at", models.DateTimeField(auto_now=True, null=True)), 93 | ("id", models.AutoField(primary_key=True, serialize=False)), 94 | ( 95 | "order_id", 96 | models.PositiveIntegerField( 97 | blank=True, 98 | default=3, 99 | help_text="题目排序,根据难度分排序,会变", 100 | null=True, 101 | ), 102 | ), 103 | ( 104 | "title", 105 | models.CharField( 106 | blank=True, 107 | default=None, 108 | help_text="题目的标题,最好有趣个性化一点", 109 | max_length=200, 110 | ), 111 | ), 112 | ( 113 | "detail", 114 | models.TextField( 115 | blank=True, 116 | default="暂无表述", 117 | help_text="题目的描述:简单创造一个背景故事", 118 | null=True, 119 | ), 120 | ), 121 | ( 122 | "goal", 123 | models.TextField( 124 | blank=True, 125 | default="暂无描述", 126 | help_text="题目的目标:掌握xxx", 127 | null=True, 128 | ), 129 | ), 130 | ( 131 | "question", 132 | models.TextField( 133 | blank=True, 134 | default="暂无题目要求", 135 | help_text="题目要求", 136 | null=True, 137 | ), 138 | ), 139 | ( 140 | "answer", 141 | models.CharField( 142 | blank=True, help_text="题目的答案", max_length=255, null=True 143 | ), 144 | ), 145 | ( 146 | "category", 147 | models.CharField( 148 | blank=True, 149 | default="成神之路", 150 | help_text="题目类别:成神之路,xpath特训", 151 | max_length=100, 152 | null=True, 153 | ), 154 | ), 155 | ( 156 | "difficulty", 157 | models.CharField( 158 | blank=True, 159 | choices=[ 160 | ("beginner", "初级"), 161 | ("intermediate", "中级"), 162 | ("advanced", 
"高级"), 163 | ("ultimate", "终极"), 164 | ], 165 | default="简单", 166 | help_text="难度", 167 | max_length=12, 168 | null=True, 169 | ), 170 | ), 171 | ( 172 | "difficulty_score", 173 | models.BigIntegerField( 174 | blank=True, 175 | default=200, 176 | help_text="难度分数,后续根据此字段排序order_id", 177 | null=True, 178 | ), 179 | ), 180 | ( 181 | "points", 182 | models.TextField( 183 | blank=True, 184 | default="暂未更新考点", 185 | help_text="本题的考点", 186 | null=True, 187 | ), 188 | ), 189 | ( 190 | "published", 191 | models.BooleanField( 192 | blank=True, default=False, help_text="是否发布", null=True 193 | ), 194 | ), 195 | ( 196 | "pass_status", 197 | models.BooleanField( 198 | blank=True, default=False, help_text="是否通过", null=True 199 | ), 200 | ), 201 | ( 202 | "solution_txt", 203 | models.URLField( 204 | blank=True, 205 | default="暂无表述", 206 | help_text="题解,图文讲解", 207 | null=True, 208 | ), 209 | ), 210 | ( 211 | "solution_video", 212 | models.URLField( 213 | blank=True, default="暂无表述", help_text="视频讲解", null=True 214 | ), 215 | ), 216 | ( 217 | "api_type", 218 | models.CharField( 219 | blank=True, 220 | default="直接对应视图", 221 | help_text="此题目的接口类型:直接对应视图,访问一个接口判断后决定是否返回视图,返回一个视图+【多个】api", 222 | max_length=255, 223 | null=True, 224 | ), 225 | ), 226 | ( 227 | "api_prefix", 228 | models.CharField( 229 | blank=True, 230 | default="topic/", 231 | help_text="topic/,view/,api/", 232 | max_length=255, 233 | null=True, 234 | ), 235 | ), 236 | ( 237 | "response_path", 238 | models.TextField( 239 | blank=True, help_text="题目路径【文件名】", null=True 240 | ), 241 | ), 242 | ], 243 | options={ 244 | "db_table": "sd_ls_topic", 245 | "ordering": ["order_id"], 246 | }, 247 | ), 248 | migrations.CreateModel( 249 | name="News", 250 | fields=[ 251 | ( 252 | "id", 253 | models.BigAutoField( 254 | auto_created=True, 255 | primary_key=True, 256 | serialize=False, 257 | verbose_name="ID", 258 | ), 259 | ), 260 | ("created_at", models.DateTimeField(auto_now_add=True, null=True)), 261 | ("updated_at", 
models.DateTimeField(auto_now=True, null=True)), 262 | ("title", models.CharField(max_length=200)), 263 | ( 264 | "url", 265 | models.CharField( 266 | blank=True, max_length=255, null=True, unique=True 267 | ), 268 | ), 269 | ("desc", models.CharField(blank=True, max_length=500, null=True)), 270 | ("publish_time", models.DateTimeField(blank=True, null=True)), 271 | ("timestamp", models.BigIntegerField(blank=True, default=0, null=True)), 272 | ("author", models.CharField(blank=True, max_length=255, null=True)), 273 | ("content", models.TextField()), 274 | ("hot", models.IntegerField(default=0)), 275 | ( 276 | "category", 277 | models.ForeignKey( 278 | blank=True, 279 | null=True, 280 | on_delete=django.db.models.deletion.CASCADE, 281 | related_name="news", 282 | to="topics.newscategory", 283 | ), 284 | ), 285 | ( 286 | "platform", 287 | models.ForeignKey( 288 | blank=True, 289 | null=True, 290 | on_delete=django.db.models.deletion.CASCADE, 291 | related_name="news", 292 | to="topics.newsplatform", 293 | ), 294 | ), 295 | ], 296 | options={ 297 | "db_table": "sd_ls_news", 298 | }, 299 | ), 300 | migrations.CreateModel( 301 | name="NewsRequestHistory", 302 | fields=[ 303 | ( 304 | "id", 305 | models.BigAutoField( 306 | auto_created=True, 307 | primary_key=True, 308 | serialize=False, 309 | verbose_name="ID", 310 | ), 311 | ), 312 | ("created_at", models.DateTimeField(auto_now_add=True, null=True)), 313 | ("updated_at", models.DateTimeField(auto_now=True, null=True)), 314 | ("request_time", models.DateTimeField(auto_now_add=True)), 315 | ("response_data", models.JSONField()), 316 | ("status", models.CharField(blank=True, max_length=255, null=True)), 317 | ( 318 | "platform", 319 | models.ForeignKey( 320 | on_delete=django.db.models.deletion.CASCADE, 321 | related_name="history", 322 | to="topics.newsplatform", 323 | ), 324 | ), 325 | ], 326 | options={ 327 | "db_table": "sd_ls_news_request_history", 328 | }, 329 | ), 330 | migrations.CreateModel( 331 | 
name="TopicCategoryRelation", 332 | fields=[ 333 | ("created_at", models.DateTimeField(auto_now_add=True, null=True)), 334 | ("updated_at", models.DateTimeField(auto_now=True, null=True)), 335 | ( 336 | "display_order", 337 | models.PositiveIntegerField(blank=True, default=100, null=True), 338 | ), 339 | ("id", models.AutoField(primary_key=True, serialize=False)), 340 | ( 341 | "category", 342 | models.ForeignKey( 343 | on_delete=django.db.models.deletion.CASCADE, 344 | to="topics.category", 345 | ), 346 | ), 347 | ( 348 | "topic", 349 | models.ForeignKey( 350 | on_delete=django.db.models.deletion.CASCADE, to="topics.topics" 351 | ), 352 | ), 353 | ], 354 | options={ 355 | "db_table": "sd_ls_topic_category_relation", 356 | "unique_together": {("topic", "category")}, 357 | }, 358 | ), 359 | ] 360 | -------------------------------------------------------------------------------- /topics/migrations/0002_web3newstag.py: -------------------------------------------------------------------------------- 1 | # Generated by Django 5.0.7 on 2025-02-27 15:25 2 | 3 | from django.db import migrations, models 4 | 5 | 6 | class Migration(migrations.Migration): 7 | 8 | dependencies = [ 9 | ("topics", "0001_initial"), 10 | ] 11 | 12 | operations = [ 13 | migrations.CreateModel( 14 | name="Web3NewsTag", 15 | fields=[ 16 | ( 17 | "id", 18 | models.BigAutoField( 19 | auto_created=True, 20 | primary_key=True, 21 | serialize=False, 22 | verbose_name="ID", 23 | ), 24 | ), 25 | ("created_at", models.DateTimeField(auto_now_add=True, null=True)), 26 | ("updated_at", models.DateTimeField(auto_now=True, null=True)), 27 | ("name", models.CharField(max_length=200)), 28 | ("tag", models.CharField(max_length=200)), 29 | ("name_en", models.CharField(max_length=200)), 30 | ("url", models.CharField(blank=True, max_length=255, null=True)), 31 | ("desc", models.CharField(blank=True, max_length=500, null=True)), 32 | ("desc_en", models.CharField(blank=True, max_length=500, null=True)), 33 | ], 34 | 
options={ 35 | "db_table": "sd_ls_news_web3_tags", 36 | }, 37 | ), 38 | ] 39 | -------------------------------------------------------------------------------- /topics/migrations/0003_web3news_web3newstag_tag_id_alter_web3newstag_name_and_more.py: -------------------------------------------------------------------------------- 1 | # Generated by Django 5.0.7 on 2025-02-27 16:06 2 | 3 | from django.db import migrations, models 4 | 5 | 6 | class Migration(migrations.Migration): 7 | 8 | dependencies = [ 9 | ("topics", "0002_web3newstag"), 10 | ] 11 | 12 | operations = [ 13 | migrations.CreateModel( 14 | name="Web3News", 15 | fields=[ 16 | ( 17 | "id", 18 | models.BigAutoField( 19 | auto_created=True, 20 | primary_key=True, 21 | serialize=False, 22 | verbose_name="ID", 23 | ), 24 | ), 25 | ("created_at", models.DateTimeField(auto_now_add=True, null=True)), 26 | ("updated_at", models.DateTimeField(auto_now=True, null=True)), 27 | ("title", models.CharField(blank=True, max_length=200, null=True)), 28 | ("sub_title", models.CharField(blank=True, max_length=500, null=True)), 29 | ( 30 | "web_link", 31 | models.CharField( 32 | blank=True, max_length=255, null=True, unique=True 33 | ), 34 | ), 35 | ("author_name", models.CharField(blank=True, max_length=50, null=True)), 36 | ("published_time", models.DateTimeField(blank=True, null=True)), 37 | ], 38 | options={ 39 | "db_table": "sd_ls_news_web3", 40 | }, 41 | ), 42 | migrations.AddField( 43 | model_name="web3newstag", 44 | name="tag_id", 45 | field=models.IntegerField(blank=True, null=True), 46 | ), 47 | migrations.AlterField( 48 | model_name="web3newstag", 49 | name="name", 50 | field=models.CharField(blank=True, max_length=200, null=True), 51 | ), 52 | migrations.AlterField( 53 | model_name="web3newstag", 54 | name="name_en", 55 | field=models.CharField(blank=True, max_length=200, null=True), 56 | ), 57 | migrations.AlterField( 58 | model_name="web3newstag", 59 | name="tag", 60 | field=models.CharField(blank=True, 
max_length=200, null=True), 61 | ), 62 | ] 63 | -------------------------------------------------------------------------------- /topics/migrations/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/topics/migrations/__init__.py -------------------------------------------------------------------------------- /topics/models.py: -------------------------------------------------------------------------------- 1 | from django.db import models 2 | import json 3 | 4 | 5 | class BaseModel(models.Model): 6 | created_at = models.DateTimeField( 7 | auto_now_add=True, null=True, blank=True 8 | ) # 创建时间 9 | updated_at = models.DateTimeField(auto_now=True, null=True, blank=True) # 修改时间 10 | 11 | class Meta: 12 | abstract = True 13 | 14 | 15 | class OrderMixin(models.Model): 16 | display_order = models.PositiveIntegerField( 17 | blank=True, null=True, default=100 18 | ) # 记录显示顺序 19 | 20 | class Meta: 21 | abstract = True 22 | 23 | 24 | class Category(BaseModel): 25 | id = models.AutoField(primary_key=True) 26 | name = models.CharField(blank=True, null=True, max_length=200, help_text="类别名") 27 | detail = models.CharField( 28 | blank=True, null=True, default=None, max_length=200, help_text="类别的描述" 29 | ) 30 | 31 | class Meta: 32 | db_table = "sd_ls_category" # 自定义表名 33 | 34 | 35 | class Topics(BaseModel): 36 | DIFFICULTY_CHOICES = [ 37 | ("beginner", "初级"), 38 | ("intermediate", "中级"), 39 | ("advanced", "高级"), 40 | ("ultimate", "终极"), 41 | ] 42 | 43 | id = models.AutoField(primary_key=True) 44 | order_id = models.PositiveIntegerField( 45 | blank=True, null=True, default=3, help_text="题目排序,根据难度分排序,会变" 46 | ) 47 | title = models.CharField( 48 | blank=True, 49 | default=None, 50 | max_length=200, 51 | help_text="题目的标题,最好有趣个性化一点", 52 | ) 53 | detail = models.TextField( 54 | blank=True, 55 | null=True, 56 | default="暂无表述", 57 | 
help_text="题目的描述:简单创造一个背景故事", 58 | ) 59 | goal = models.TextField( 60 | blank=True, null=True, default="暂无描述", help_text="题目的目标:掌握xxx" 61 | ) 62 | question = models.TextField( 63 | blank=True, null=True, default="暂无题目要求", help_text="题目要求" 64 | ) 65 | answer = models.CharField( 66 | blank=True, null=True, max_length=255, help_text="题目的答案" 67 | ) 68 | category = models.CharField( 69 | blank=True, 70 | null=True, 71 | default="成神之路", 72 | max_length=100, 73 | help_text="题目类别:成神之路,xpath特训", 74 | ) 75 | difficulty = models.CharField( 76 | blank=True, 77 | null=True, 78 | default="简单", 79 | max_length=12, 80 | choices=DIFFICULTY_CHOICES, 81 | help_text="难度", 82 | ) 83 | difficulty_score = models.BigIntegerField( 84 | blank=True, 85 | null=True, 86 | default=200, 87 | help_text="难度分数,后续根据此字段排序order_id", 88 | ) 89 | points = models.TextField( 90 | blank=True, 91 | null=True, 92 | default="暂未更新考点", 93 | help_text="本题的考点", 94 | ) 95 | published = models.BooleanField( 96 | blank=True, null=True, default=False, help_text="是否发布" 97 | ) 98 | pass_status = models.BooleanField( 99 | blank=True, null=True, default=False, help_text="是否通过" 100 | ) 101 | solution_txt = models.URLField( 102 | blank=True, null=True, default="暂无表述", help_text="题解,图文讲解" 103 | ) 104 | solution_video = models.URLField( 105 | blank=True, null=True, default="暂无表述", help_text="视频讲解" 106 | ) 107 | api_type = models.CharField( 108 | blank=True, 109 | null=True, 110 | max_length=255, 111 | default="直接对应视图", 112 | help_text="此题目的接口类型:直接对应视图,访问一个接口判断后决定是否返回视图,返回一个视图+【多个】api", 113 | ) 114 | api_prefix = models.CharField( 115 | blank=True, 116 | null=True, 117 | max_length=255, 118 | default="topic/", 119 | help_text="topic/,view/,api/", 120 | ) 121 | response_path = models.TextField( 122 | blank=True, null=True, help_text="题目路径【文件名】" 123 | ) 124 | 125 | class Meta: 126 | db_table = "sd_ls_topic" # 自定义表名 127 | ordering = ["order_id"] # 默认按 order_id 排序 128 | 129 | def __str__(self): 130 | return self.title 131 | 132 | 
133 | # 题目与 Category 的中间表 134 | class TopicCategoryRelation(BaseModel, OrderMixin): 135 | id = models.AutoField(primary_key=True) 136 | 137 | topic = models.ForeignKey(Topics, on_delete=models.CASCADE) 138 | category = models.ForeignKey(Category, on_delete=models.CASCADE) 139 | 140 | class Meta: 141 | db_table = "sd_ls_topic_category_relation" # 自定义表名 142 | unique_together = ("topic", "category") # 确保唯一关系 143 | 144 | def __str__(self): 145 | return f"Topic {self.topic_id} - Category {self.category_id}" 146 | 147 | 148 | # 平台表 149 | class NewsPlatform(BaseModel): 150 | name = models.CharField(max_length=100) # 平台名称 151 | slug = models.SlugField(unique=True) # 用于URL的标识符 152 | description = models.CharField(blank=True, null=True, max_length=255) # 平台简介 153 | 154 | class Meta: 155 | db_table = "sd_ls_news_platform" 156 | 157 | def __str__(self): 158 | return self.name 159 | 160 | 161 | # 新闻类别表 162 | class NewsCategory(BaseModel): 163 | name = models.CharField(max_length=100) # 类别名称 164 | slug = models.CharField(unique=True, max_length=255) # 用于URL的标识符 165 | description = models.TextField(blank=True, null=True) # 类别简介 166 | 167 | class Meta: 168 | db_table = "sd_ls_news_category" 169 | 170 | def __str__(self): 171 | return self.name 172 | 173 | 174 | class NewsRequestHistory(BaseModel): 175 | request_time = models.DateTimeField(auto_now_add=True) 176 | response_data = models.JSONField() # 处理后的结果数据 177 | status = models.CharField(blank=True, null=True, max_length=255) 178 | platform = models.ForeignKey( 179 | NewsPlatform, related_name="history", on_delete=models.CASCADE 180 | ) # 所属平台 181 | 182 | class Meta: 183 | db_table = "sd_ls_news_request_history" 184 | 185 | def __str__(self): 186 | return f"Request at {self.request_time}" 187 | 188 | 189 | # 新闻表 190 | class News(BaseModel): 191 | title = models.CharField(max_length=200) # 新闻标题 192 | url = models.CharField( 193 | blank=True, null=True, unique=True, max_length=255 194 | ) # 新闻链接 195 | desc = 
models.CharField(max_length=500, blank=True, null=True) 196 | publish_time = models.DateTimeField(blank=True, null=True) 197 | timestamp = models.BigIntegerField(default=0, blank=True, null=True) 198 | author = models.CharField(max_length=255, blank=True, null=True) 199 | content = models.TextField() # 新闻内容 200 | hot = models.IntegerField(default=0) # 新闻内容 201 | platform = models.ForeignKey( 202 | NewsPlatform, 203 | related_name="news", 204 | on_delete=models.CASCADE, 205 | blank=True, 206 | null=True, 207 | ) # 所属平台 208 | category = models.ForeignKey( 209 | NewsCategory, 210 | related_name="news", 211 | on_delete=models.CASCADE, 212 | blank=True, 213 | null=True, 214 | ) # 新闻类别 215 | 216 | class Meta: 217 | db_table = "sd_ls_news" 218 | 219 | def __str__(self): 220 | return self.title 221 | 222 | 223 | # 新闻表 224 | class Web3NewsTag(BaseModel): 225 | tag_id = models.IntegerField(blank=True, null=True) 226 | name = models.CharField(max_length=200, blank=True, null=True) 227 | tag = models.CharField(max_length=200, blank=True, null=True) 228 | name_en = models.CharField(max_length=200, blank=True, null=True) 229 | url = models.CharField(blank=True, null=True, max_length=255) 230 | desc = models.CharField(max_length=500, blank=True, null=True) 231 | desc_en = models.CharField(max_length=500, blank=True, null=True) 232 | 233 | class Meta: 234 | db_table = "sd_ls_news_web3_tags" 235 | 236 | def __str__(self): 237 | return self.name 238 | 239 | 240 | class Web3News(BaseModel): 241 | title = models.CharField(max_length=200, blank=True, null=True) 242 | sub_title = models.CharField(max_length=500, blank=True, null=True) 243 | web_link = models.CharField(unique=True, max_length=255, blank=True, null=True) 244 | author_name = models.CharField(max_length=50, blank=True, null=True) 245 | published_time = models.DateTimeField(blank=True, null=True) 246 | 247 | class Meta: 248 | db_table = "sd_ls_news_web3" 249 | 250 | def __str__(self): 251 | return self.title 252 | 
-------------------------------------------------------------------------------- /topics/scheduler.py: -------------------------------------------------------------------------------- 1 | # myapp/scheduler.py 2 | from apscheduler.schedulers.background import BackgroundScheduler 3 | from apscheduler.triggers.interval import IntervalTrigger 4 | from apscheduler.triggers.cron import CronTrigger # 使用 CronTrigger 5 | from topics.tasks import fetch_and_save_news # 假设你有任务在 tasks.py 中 6 | 7 | 8 | def start_scheduler(): 9 | scheduler = BackgroundScheduler() 10 | scheduler.add_job( 11 | fetch_and_save_news, 12 | trigger=CronTrigger( 13 | minute="0,10,20,30,40,50" 14 | ), # 每个整十分(00, 10, 20, 30, 40, 50)执行一次 15 | # trigger=IntervalTrigger(minutes=10), # 每 10 分钟执行一次 16 | id="fetch_and_save_news", 17 | name="定时任务:十分钟一次,获取新闻", 18 | replace_existing=True, 19 | ) 20 | scheduler.start() 21 | -------------------------------------------------------------------------------- /topics/serializers.py: -------------------------------------------------------------------------------- 1 | from rest_framework import serializers 2 | from .models import Topics 3 | 4 | 5 | class TopicsSerializer(serializers.ModelSerializer): 6 | class Meta: 7 | model = Topics 8 | fields = "__all__" 9 | 10 | def to_representation(self, instance): 11 | representation = super().to_representation(instance) 12 | response_path = representation.get("response_path") 13 | api_prefix = representation.get("api_prefix") 14 | 15 | representation["response_path"] = f"{api_prefix}{response_path}" 16 | 17 | # if api_prefix.startswith('url/'): 18 | # pass 19 | # elif response_path: 20 | # representation['response_path'] = f"{api_prefix}{response_path}" 21 | 22 | return representation 23 | -------------------------------------------------------------------------------- /topics/static/topics/css/style.css: -------------------------------------------------------------------------------- 1 | td, th { 2 | white-space: nowrap; 3 | 
def fetch_and_save_news():
    """Fetch the latest news for every known platform and persist it.

    For each platform slug returned by ``get_all_platforms()``:
      * download the news payload via ``fetch_platform_news``,
      * insert each item as a ``News`` row (failed rows — typically
        unique-constraint duplicates — are logged and skipped),
      * archive the raw payload in ``NewsRequestHistory``,
      * trim the history table so only the newest 100 rows survive once it
        grows past 100 (the old inline comments claimed 50, contradicting
        the actual slice; the comments are corrected here to match the code).

    Sleeps 1s between platforms to avoid hammering the upstream sources.
    """
    for platform_slug in get_all_platforms():
        # NOTE(review): ``get`` raises NewsPlatform.DoesNotExist if the slug is
        # unknown — presumably slugs are pre-seeded; verify against the seeder.
        platform = NewsPlatform.objects.get(slug=platform_slug)
        print(f"采集{platform.name} {platform.slug}中...")
        data = fetch_platform_news(platform.slug)
        if data:
            for item in data:
                try:
                    # Attach the owning platform before insertion (requires py3.9+ dict |).
                    News.objects.create(**(item | {"platform": platform}))
                except Exception as e:
                    # Most failures are duplicate web_link/title rows; log instead of
                    # silently discarding so genuine errors remain visible.
                    print(f"保存新闻失败,已跳过: {e}")
                    continue
            NewsRequestHistory.objects.create(response_data=data, platform=platform)
            # History trimming: once more than 100 rows exist, keep only the
            # newest 100 and delete the rest.
            total = NewsRequestHistory.objects.count()
            print(f"记录数量:{total}")
            if total > 100:
                # IDs of the newest 100 rows; everything else is purged.
                preserve_ids = list(
                    NewsRequestHistory.objects.order_by("-id")[:100].values_list("id", flat=True)
                )
                NewsRequestHistory.objects.exclude(id__in=preserve_ids).delete()
            print(f"{platform.name} {platform.slug} 保存完成")
        else:
            # Plain string — the old code used an f-string with no placeholders.
            print("请求出错了!")
        sleep(1)
-------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | 4 | {% block content %} 5 | 6 | 9 |
10 | 找不到你想要的页面了~ 11 |
12 | {% endblock %} 13 | -------------------------------------------------------------------------------- /topics/templates/topics/base.html: -------------------------------------------------------------------------------- 1 | {% load static %} 2 | 3 | 4 | 5 | 6 | 7 | 8 | {% block charset %} 9 | {% endblock %} 10 | 11 | 12 | {% block title %}爬虫百战成神{% endblock %} 13 | 14 | 15 | 16 | 17 | 18 | 19 | 20 | 21 | 33 | 34 | 35 | 36 |
37 | {% block header %} 38 | {% include "topics/header.html" %} 39 | {% endblock %} 40 |
41 | 42 |
43 | 44 | {% block question %}{% endblock %} 45 | 46 | {% block answer %} 47 | 48 |
49 |

提交答案

50 |
51 |
52 | 53 | 54 |
55 | 56 |
57 |
58 |
59 | 60 | 92 | {% endblock %} 93 | {% block content %}{% endblock %} 94 |
95 | 96 | 97 | 98 | 99 | 121 | {% block script %} 122 | 123 | {% endblock %} 124 | -------------------------------------------------------------------------------- /topics/templates/topics/demo.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %}新闻类别{% endblock %} 4 | {% block answer %} 5 | 6 | {% endblock %} 7 | {% block content %} 8 |
9 |

新闻类别

10 | 11 |
12 | 13 |
14 |
15 | 国际新闻 16 |
17 |
国际新闻
18 |

了解全球范围内的新闻热点,聚焦国际局势。

19 |

来源:BBC, CNN, Al Jazeera

20 | 查看国际新闻 21 |
22 |
23 |
24 | 25 | 26 |
27 |
28 | 国内新闻 29 |
30 |
国内新闻
31 |

关注本国的时事新闻,涵盖社会、政治、经济等各个方面。

32 |

来源:新华网, 人民日报, 中国日报

33 | 查看国内新闻 34 |
35 |
36 |
37 | 38 | 39 |
40 |
41 | 体育新闻 42 |
43 |
体育新闻
44 |

关注各类体育赛事、运动员动态及体育评论。

45 |

来源:ESPN, 体育日报, FIFA

46 | 查看体育新闻 47 |
48 |
49 |
50 | 51 | 52 |
53 |
54 | 科技新闻 55 |
56 |
科技新闻
57 |

报道最新的科技趋势、创新产品、以及技术突破。

58 |

来源:TechCrunch, Wired, The Verge

59 | 查看科技新闻 60 |
61 |
62 |
63 | 64 | 65 |
66 |
67 | 娱乐新闻 68 |
69 |
娱乐新闻
70 |

聚焦电影、电视剧、明星八卦及娱乐圈动态。

71 |

来源:娱乐头条, 新浪娱乐, 腾讯娱乐

72 | 查看娱乐新闻 73 |
74 |
75 |
76 | 77 | 78 |
79 |
80 | 财经新闻 81 |
82 |
财经新闻
83 |

提供全球财经新闻,涉及股票、市场、投资等领域。

84 |

来源:华尔街日报, 财新网, Bloomberg

85 | 查看财经新闻 86 |
87 |
88 |
89 |
90 |
91 | {% endblock %} 92 | -------------------------------------------------------------------------------- /topics/templates/topics/header.html: -------------------------------------------------------------------------------- 1 | {% load static %} 2 | 3 | 4 | -------------------------------------------------------------------------------- /topics/templates/topics/index/index.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block answer %} 4 | 5 | {% endblock %} 6 | {% block content %} 7 | 54 | 55 |
56 | 57 | 58 |
59 |
60 | 莱卡云 61 |
62 |
莱卡云
63 |

低价格高性能服务器,速速上车,开启学习之旅~

莱卡云拥有精选华中/香港/美国/欧洲多种(境内境外)云服务器产品(境外服务器可以免备案),低至25元每月。 64 |

65 | 立即购买 67 |
68 |
69 |
70 | 71 | 72 |
73 |
74 | ... 76 |

爬虫百战成神 - LearnSpider

77 |
78 | 靶场 79 | 爬虫 80 | 教程 81 | 自动化 82 | 一站式 83 | DrissionPage 84 | Python 85 |
86 |
87 | 88 |
89 |
90 | 不仅是一个练习场,也配套有每道题目的多种技术示例代码,文档讲解,视频演示。 91 |
92 |
93 | 题目由易到难,由浅入深,想让大家在刷题与实践的过程中甚至是从零学会爬虫(因为思想学会后,剩下的代码其实就是工具的使用),在这个过程中增加自己对于代码和场景的理解。 94 |
95 |
96 | 本项目目标覆盖爬虫初级,进阶和高级。涉及到requests,scrapy这些请求工具,还有selenium,drissionpage这些自动化工具框架。 97 |
98 |
99 | 涉及到接口请求,静态页面解析,也涉及到代码混淆,接口加密,也包含各种抓包工具的使用,chrome开发者工具的使用等。 100 |
101 |
102 | 包括一些新颖的反爬技术,比如前端层面的反爬,svg反爬,css反爬,雪碧图等,也比如新兴的反爬技术比如wasm。 103 |
104 |
105 | 总之就是我会什么,就想教大家什么。所以此仓库的内容也会无限拓展。也欢迎大家的贡献。 106 |
107 | 108 |
109 | 此仓库旨在让大家在刷题的过程中以结果和成就感驱动学习,学习到某个知识点后可以快速应用,从而感受到学到了东西,感受到爬虫是如此的简单有趣。而不是学完之后因为网站内容变动而没有刷题的地方,久而久之像没学一样。 110 |
111 |
112 | 并且本项目最想让大家养成举一反三,逻辑推理的思考思维习惯。 113 |
114 |
115 | 116 |
117 |

cpython666 出品

118 | 开启爬虫成神之旅 119 |
120 |
121 | 122 | 123 |
124 |
125 | 猿人学 126 |
127 |
猿人学
128 |

爬虫逆向反爬虫课程,3000爬虫er圈子,不定期聚会,行业顶级资源。

爬虫行业每10人中有一人就是猿人学的学员。

报课提站长名字可享内部优惠价格。 129 |

130 | 了解更多 131 |
132 |
133 |
134 | 135 |
136 | 137 | 138 | 144 | 145 |
146 |

赞助商

147 |
148 | 157 | 166 | 175 | 185 |
186 |
187 | 188 | 189 |
190 |

友情链接

191 |
192 | 201 | 211 |
212 |
213 | 214 | {% endblock %} 215 | -------------------------------------------------------------------------------- /topics/templates/topics/index/list.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block answer %}{% endblock %} 4 | 5 | {% block content %} 6 |
7 |
8 | 题目列表 9 |
10 |
11 | 12 |
13 | 14 | 25 |
26 | 27 |
28 | 29 | 30 | 31 | 32 | 36 | 37 | 38 | 39 | 40 | 41 |
# 34 | 名称 35 | 链接
42 |
43 | 44 | 45 | 46 | 47 | 48 | 49 | 50 | 51 | 52 | 53 | 54 | 55 | 56 |
难度发布状态题解类别简介
57 |
58 |
59 | 63 |
64 |
65 | 66 | {% endblock %} 67 | 68 | {% block script %} 69 | 237 | 238 | {% endblock %} -------------------------------------------------------------------------------- /topics/templates/topics/index/sandbox.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %}试金场{% endblock %} 4 | {% block answer %} 5 | 6 | {% endblock %} 7 | {% block content %} 8 |
9 |
10 | 11 |
12 | 13 |
14 | 新闻类型爬虫工具 15 |
16 |
星梦News
17 |

这个工具可以帮助你爬取新闻网站的新闻内容,如标题、正文和作者等。

18 | 进入工具 19 |
20 |
21 |
22 | 23 |
24 | 25 |
26 | 图片类型爬虫工具 27 |
28 |
星梦WallPaper
29 |

通过此工具,你可以爬取图片资源并进行批量下载。

30 | 进入工具 31 |
32 |
33 |
34 | 35 |
36 | 37 |
38 | 视频评论爬虫工具 39 |
40 |
星梦Video
41 |

这个工具帮助你抓取视频平台的评论数据,包括点赞、回复等。

42 | 敬请期待~ 43 |
44 |
45 |
46 | 47 |
48 | 49 |
50 | 音乐评论爬虫工具 51 |
52 |
星梦Music
53 |

该工具可爬取音乐平台中的歌曲评论,并按用户或时间排序。

54 | 敬请期待~ 55 |
56 |
57 |
58 | 59 |
60 | 61 |
62 | 电商商品爬虫工具 63 |
64 |
星梦Shop
65 |

此工具能帮助你爬取电商平台的商品信息,包括价格、评价、销量等。

66 | 敬请期待~ 67 |
68 |
69 |
70 |
71 |
72 | {% endblock %} 73 | -------------------------------------------------------------------------------- /topics/templates/topics/index/shorthand.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %}速记手册{% endblock %} 4 | {% block answer %} 5 | 6 | {% endblock %} 7 | {% block content %} 8 |
9 | ... 10 |
11 | 速记手册 12 |
13 |
14 | {% endblock %} -------------------------------------------------------------------------------- /topics/templates/topics/index/tools.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %}工具箱{% endblock %} 4 | 5 | {% block answer %} 6 | 7 | {% endblock %} 8 | 9 | {% block content %} 10 |
11 |
12 | 13 | 27 | 28 | 29 |
30 |
31 | 32 |
33 |
34 | 工具1 35 |
36 |
工具1
37 |

工具1的简短描述。它帮助你进行各种任务。

38 | 进入工具 39 |
40 |
41 |
42 | 43 | 44 |
45 |
46 | 工具2 47 |
48 |
工具2
49 |

工具2的简短描述。它用于处理复杂的数据分析任务。

50 | 进入工具 51 |
52 |
53 |
54 | 55 | 56 |
57 |
58 | 工具3 59 |
60 |
工具3
61 |

工具3是一个高效的文本处理工具,适用于各种文本分析需求。

62 | 进入工具 63 |
64 |
65 |
66 |
67 |
68 |
69 |
70 | {% endblock %} 71 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/111.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 雪碧图 5 | {% endblock %} 6 | 7 | {% block content %} 8 |

雪碧图

9 | 10 | {% endblock %} 11 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/112.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 雪碧图 5 | {% endblock %} 6 | 7 | {% block content %} 8 |

雪碧图

9 | 10 | {% endblock %} 11 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/ajax.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %} 4 | 何为动态网页 5 | {% endblock %} 6 | {% block question %} 7 |

您好🦆, 爬虫er~👋

8 |

9 | 什么是动态网页呢?🤠 10 |

11 | 查看这个网页的源代码,可以找到数据吗?
12 | 请问:动态网页中加载的数据在浏览器的开发者工具的网络标签栏下面的哪个筛选框里?【完整的内容,区分大小写,包括分隔符】 13 | 14 | {% endblock %} 15 | 16 | {% block content %} 17 |
18 |

动态内容

19 |
20 | 21 |
22 |
23 | 55 | {% endblock %} 56 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/asyncio.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 协程,不是携程奥😁 5 | {% endblock %} 6 | 7 | {% block content %} 8 |

协程,不是携程奥😁

9 | 10 | {% endblock %} 11 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/course-buying-guide.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 爬虫买课指南 5 | {% endblock %} 6 | {% block question %} 7 |

8 | 又又又看完一篇文章之后,这个时候是否对于报班学习有一定认识了呢? 9 | 请回答:《有点感觉了》 10 |

11 | {% endblock %} 12 | {% block content %} 13 |

爬虫买课指南

14 |

15 | 学习爬虫需要报班吗?你需要知道的事情。 16 |

17 | 20 | {% endblock %} 21 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/css-sprite.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 雪碧图 5 | {% endblock %} 6 | 7 | {% block content %} 8 |

雪碧图

9 | 10 | {% endblock %} 11 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/demo.html: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | {# #} 6 | Title 7 | 8 | 9 | 吧小伙伴还是喜爱u不误 10 | 11 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/demo_get_server_time.html: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 7 | 8 | Document 9 | 10 | 11 |

12 | 13 | 63 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/devtools.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 开发者工具 5 | {% endblock %} 6 | 7 | {% block content %} 8 |

开发者工具

9 | 10 | {% endblock %} 11 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/easy-spider.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 对爬虫祛魅 5 | {% endblock %} 6 | {% block question %} 7 |

8 | 看完本篇文章之后,你还害怕爬虫吗? 9 | 请回答:《不害怕!!!》 10 |

11 | {% endblock %} 12 | {% block content %} 13 |

对爬虫祛魅

14 |

15 | 知己知彼,方能百战不胜,最好对将要学习的东西先有个大局观。不然会一次又一次遇到新东西,好像看不到尽头,进而磨灭热情。 16 |

17 | 20 | {% endblock %} 21 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/h1-6.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 杂牌军写的前端代码 5 | {% endblock %} 6 | 7 | {% block content %} 8 |

杂牌军写的前端代码

9 | 10 | 11 | 12 | {% endblock %} 13 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/hello-get.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | GET请求 5 | {% endblock %} 6 | 7 | {% block question %} 8 |

GET 请求介绍

9 |

10 | GET 请求是 HTTP 协议中最常见的请求方法之一,通常用于从服务器获取资源。你了解它吗?
11 | 请回答:【了解】或【不了解】 12 |

13 | {% endblock %} 14 | 15 | {% block content %} 16 |

17 | GET 请求是用于向服务器请求数据的一种方法。它的特点是:所有的数据(如查询参数)都会附加在 URL 中, 18 | 并通过浏览器的地址栏进行发送。GET 请求不会对服务器的数据进行修改,只是用于获取资源。 19 |

20 |

GET 请求的特点:

21 |
    22 |
  • 请求参数通过 URL 传递(例如:`?name=value&age=30`)。
  • 23 |
  • 数据大小受限(通常约为 2048 字符)。
  • 24 |
  • 请求是安全的,因为它不会修改服务器上的资源。
  • 25 |
  • GET 请求通常是幂等的,也就是说多次请求相同的 URL 会得到相同的响应。
  • 26 |
  • GET 请求支持浏览器缓存。
  • 27 |
28 | 29 |

示例:

30 |

如果我们通过以下 GET 请求访问一个页面:

31 |
32 | GET /search?q=python HTTP/1.1
33 | Host: example.com
34 | 
35 | 36 |

服务器会根据查询参数 `q=python` 返回相应的资源(比如搜索结果)。

37 | {% endblock %} 38 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/hello-post-form.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | POST请求-表单请求体 5 | {% endblock %} 6 | 7 | {% block question %} 8 |

POST 请求类型:JSON 与表单的区别

9 |

10 | 你知道 POST 请求发送数据的不同格式吗?我们有 JSON 格式和表单格式的区别哦!
11 | 请回答:【了解】或【不了解】 12 |

13 | {% endblock %} 14 | 15 | {% block content %} 16 |

17 | POST 请求是 HTTP 协议中常用的一种请求方法,主要用于向服务器提交数据。在提交数据时,POST 请求有不同的 18 | **数据格式**,其中最常用的有: 19 |

20 | 21 |
22 | 23 | 45 | 46 | {% endblock %} 47 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/hello-post-json.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | POST请求-JSON请求体 5 | {% endblock %} 6 | 7 | {% block question %} 8 |

POST 请求介绍

9 |

10 | POST 请求用于向服务器提交数据,你知道怎么通过代码发送一个 POST 请求吗?
11 | 请回答:【了解】或【不了解】 12 |

13 | {% endblock %} 14 | 15 | {% block content %} 16 | 17 |
18 | 19 | 43 | 44 | {% endblock %} 45 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/intro.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 题目介绍 5 | {% endblock %} 6 | {% block question %} 7 |

8 | 主要介绍这些题目的特点 9 |
10 | 11 | 请问:如何获取到数据呢?请回答:【灵活变通】 12 |

13 | {% endblock %} 14 | {% block content %} 15 |

题目介绍

16 |

17 | 不管你是用什么方式,自动化,协议,甚至是,复制粘贴。没错,不择手段,只要你能够获取答案!当然,我会尽量把题目设计成让你无法用手动解决,嘿嘿嘿~。 18 |
尽量做到从易到难,由浅入深,遇到黄色报错页面不要慌,是因为题目还没出到那里。 19 |

20 | {% endblock %} 21 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/lsp-spider.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %} 4 | 色图收集者 5 | {% endblock %} 6 | {% block question %} 7 |

您好🦆, 爬虫er~👋

8 |

9 | 下面是一些精彩的色图展示,请欣赏!🎨 10 |

11 | 将所有的图片下载到本地,存放到【学习资料】文件夹,图片命名为:标题-描述-图片名 12 |
13 | 偷着乐吧小伙子,这道题目答案是:【我只是爱学习】 14 |
15 | 记得常常温习哟~😉 16 | 20 | {% endblock %} 21 | 22 | {% block content %} 23 |
24 |

色图收集者

25 |
26 | 27 |
28 |
29 | 色图 1 30 |
31 |
色图标题 1
32 |

描述:这是一幅色彩鲜艳的图像,展示了美丽的风景。

33 |
34 |
35 |
36 | 37 |
38 |
39 | 色图 2 40 |
41 |
色图标题 2
42 |

描述:这幅图像展示了丰富的色彩和动态的设计。

43 |
44 |
45 |
46 | 47 |
48 |
49 | 色图 3 50 |
51 |
色图标题 3
52 |

描述:这幅图像以抽象的形式展现了色彩的碰撞。

53 |
54 |
55 |
56 | 57 |
58 |
59 | 色图 4 60 |
61 |
色图标题 4
62 |

描述:这幅图像以优雅的色调展示了艺术的美感。

63 |
64 |
65 |
66 | 67 |
68 |
69 | 色图 5 70 |
71 |
色图标题 5
72 |

描述:这幅图像充满了生动的色彩和细腻的细节。

73 |
74 |
75 |
76 | 77 |
78 |
79 | 色图 6 80 |
81 |
色图标题 6
82 |

描述:这幅图像展示了色彩和形状的完美结合。

83 |
84 |
85 |
86 |
87 |
88 | {% endblock %} 89 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/news.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 新闻收集者 5 | {% endblock %} 6 | {% block question %} 7 |

您好🦆, 爬虫er~👋

8 |

9 | 以下是一些与爬虫相关的新闻,希望你喜欢!🕷 10 |

11 | 获取所有的新闻信息,输出这样的格式:[{"title":"xxx","auther":"xxx","publish_date":"xxx","detail":"xxx"},...] 12 |
13 | 成功获取了吗?请回答【成功了!】 14 | {% endblock %} 15 | 16 | {% block content %} 17 |
18 |

新闻收集者

19 |
20 | 21 |
22 |
23 |
24 |
Python 爬虫挑战赛圆满结束
25 |
发布日期: 2024-07-30
26 |

作者: 爬虫大师

27 |

本次 Python 爬虫挑战赛吸引了来自全球的数百名爬虫爱好者。经过激烈的比拼,最终产生了前三名获奖者。他们的作品展示了爬虫技术的无限可能。

28 |
29 |
30 |
31 | 32 |
33 |
34 |
35 |
新型反爬虫技术亮相科技大会
36 |
发布日期: 2024-07-28
37 |

作者: 安全先锋

38 |

在今年的科技大会上,多个公司展示了他们最新的反爬虫技术。这些技术旨在保护网站内容,防止未经授权的爬取行为,引起了广泛关注。

39 |
40 |
41 |
42 | 43 |
44 |
45 |
46 |
知名数据科学家分享爬虫最佳实践
47 |
发布日期: 2024-07-25
48 |

作者: 数据达人

49 |

著名数据科学家在最近的研讨会上分享了爬虫的最佳实践,包括如何处理反爬机制、如何提高爬虫效率以及数据清洗的技巧,受到了与会者的热烈欢迎。

50 |
51 |
52 |
53 | 54 |
55 |
56 |
57 |
Web Scraping 在商业中的应用
58 |
发布日期: 2024-07-22
59 |

作者: 商业分析师

60 |

越来越多的企业开始利用 Web Scraping 技术来收集竞争对手的信息、市场趋势以及客户反馈。本文介绍了几种典型的商业应用案例。

61 |
62 |
63 |
64 | 65 |
66 |
67 |
68 |
AI 与爬虫技术的结合:未来展望
69 |
发布日期: 2024-07-20
70 |

作者: 技术前沿

71 |

随着 AI 技术的发展,爬虫技术也在不断进步。未来,AI 将在爬虫中发挥更加重要的作用,帮助爬虫变得更加智能和高效。

72 |
73 |
74 |
75 | 76 |
77 |
78 |
79 |
爬虫技术在学术研究中的应用
80 |
发布日期: 2024-07-18
81 |

作者: 学术达人

82 |

爬虫技术在学术研究中有着广泛的应用,例如数据收集、文献综述和社会网络分析。本文探讨了几种典型的学术应用场景。

83 |
84 |
85 |
86 |
87 |
88 | {% endblock %} 89 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/pagination-1.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %} 4 | 翻页网页 5 | {% endblock %} 6 | {% block question %} 7 |

您好🦆, 爬虫er~👋

8 |

9 | 这是需要翻页的网页🫣 10 |

11 | 它与上一道题目没太大区别对吧,只是多加了一个循环。
12 | 请问:第一百页返回的内容是什么?【一个json格式的答案】 13 | 14 | {% endblock %} 15 | 16 | {% block content %} 17 |
18 |

翻页内容

19 |
20 | 21 |
22 | 35 |
36 | 37 | 81 | {% endblock %} 82 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/pagination-2.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %}翻页网页2{% endblock %} 4 | {% block question %} 5 |

您好🦆, 爬虫er~👋

6 |

7 | 出bug了吗?🫣 8 |

9 | 怎么又回到列表页了?哎,对不起了🥺,直接把题目列表页面copy过来了。
10 | 发现这个翻页列表与上个翻页列表的区别了吧!请问每页都点一下请求了几次数据接口? 11 | 12 | {% endblock %} 13 | {% block content %} 14 |
15 |
16 | 题目列表 17 |
18 |
19 |
20 | 21 | 22 | 23 | 24 | 28 | 29 | 30 | 31 | 32 | 33 |
# 26 | 名称 27 | 链接
34 |
35 | 36 | 37 | 38 | 39 | 40 | 41 | 42 | 43 | 44 | 45 | 46 | 47 |
难度状态题解类别简介
48 |
49 |
50 | 54 |
55 |
56 | 57 | {% endblock %} 58 | 59 | {% block script %} 60 | 212 | 213 | {% endblock %} -------------------------------------------------------------------------------- /topics/templates/topics/pages/pagination-table.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %} 4 | 翻页表格 5 | {% endblock %} 6 | {% block question %} 7 |

您好🦆, 爬虫er~👋

8 |

9 | 这是一个翻页的网页,并且数据格式是表格🫣 10 |

11 | 它与翻页题目没太大区别对吧,只是显示成了一个表格。
12 | {% endblock %} 13 | {% block answer %}{% endblock %} 14 | {% block content %} 15 |
16 |

翻页表格

17 |
18 | 19 |
20 | 33 |
34 | 35 | 115 | {% endblock %} 116 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/redirect.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 网页重定向 5 | {% endblock %} 6 | 7 | {% block content %} 8 |

网页重定向

9 | 10 | {% endblock %} 11 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/rowspan-table.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 跨行表格 5 | {% endblock %} 6 | 7 | {% block content %} 8 |

跨行表格

9 | 10 | {% endblock %} 11 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/spider-guide.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 爬虫学习指南 5 | {% endblock %} 6 | {% block question %} 7 |

8 | 又又看完一篇文章之后,你还害怕爬虫吗?
9 | 请问up推荐使用的浏览器是什么浏览器?【五个汉字】 10 |

11 | {% endblock %} 12 | {% block content %} 13 |

爬虫学习指南

14 |

15 | 爬虫涉及到的学科,如何学编程,网上自学优缺点,我的学习方法和建议。 16 |

17 | 20 | {% endblock %} 21 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/spider-roadmap.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 爬虫学习路线 5 | {% endblock %} 6 | {% block question %} 7 |

8 | 又又又看完一篇文章之后,有没有对于爬虫更清晰一点? 9 |
10 | 11 | 请问:dp的全称是什么?【12个字母,其中有两个是大写】 12 |

13 | {% endblock %} 14 | {% block content %} 15 |

爬虫学习路线

16 |

17 | 爬虫的学习路线,爬虫的人生规划 18 |

19 | 22 | {% endblock %} 23 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/svg.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | svg 5 | {% endblock %} 6 | 7 | {% block content %} 8 |

svg

9 | 10 | {% endblock %} 11 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/table-key-value.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 表格键值对获取 5 | {% endblock %} 6 | 7 | {% block content %} 8 |

表格键值对获取

9 | 10 | {% endblock %} 11 | -------------------------------------------------------------------------------- /topics/templates/topics/pages/wenjuan.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %} 4 | 自动化问卷填写 5 | {% endblock %} 6 | {% block question %} 7 |

自动化问卷填写🤖

8 |

9 | 解决自己的需求或者赚钱...都是一个有力的理由!🫣 10 |

11 |

12 | 小新为了一个作业,要填写几千份问卷!!!!!!
13 | 他无法想象要填写到什么时候,直到他从朋友那里得知了Python自动化...
14 | 没有花里胡哨的操作,只是拼接了一些简单基础的代码来自动化填写问卷。 15 |

16 | {% endblock %} 17 | 18 | {% block content %} 19 | 20 |
21 |
22 | 23 |
24 | 25 |
26 | 27 |
28 |
29 | 30 |
31 |
32 | 33 |
34 | 35 |
36 | 37 |
38 |
39 | 40 |
41 |
42 |
43 |
44 | 45 |
46 |
47 | 48 |
49 | 50 |
51 | 52 |
53 | 54 |
55 |
56 | 57 |
58 |
59 | 60 |
61 | 62 |
63 | 64 |
65 | 66 |
67 |
68 | 69 |
70 |
71 |
78 |
79 | 80 |
81 |
82 | 83 |
84 | 85 |
86 | 87 |
88 | 89 |
90 |
91 | 92 |
93 |
94 | 95 |
96 | 97 |
98 |
99 | 100 |
101 |
102 | 103 |
104 | 105 |
106 | 107 |
108 | 109 |
110 |
111 | 112 |
113 |
114 |
115 |
116 |
117 |
118 |
119 |
120 | 121 | 122 | 130 | {% endblock %} 131 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/about_us.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/sandbox/news/news_base.html" %} 2 | {% load static %} 3 | {% block content %} 4 |
5 | 6 |

关于我们

7 | 8 | 9 |
10 |

我们的使命

11 |

12 | 星梦新闻致力于为用户提供最新、最全面的新闻信息。我们的目标是让用户能够随时随地了解全球范围内的热点新闻,覆盖各类领域,包括科技、娱乐、体育等。通过高效的新闻推荐和精准的搜索引擎,我们希望帮助用户更好地获取感兴趣的内容。 13 |

14 |
15 | 16 | 17 |
18 |

我们的团队

19 |
20 |
21 |
22 | 团队成员1 23 |
24 |
张三
25 |

项目经理,负责整体项目的规划和管理。

26 |
27 |
28 |
29 |
30 |
31 | 团队成员2 32 |
33 |
李四
34 |

前端开发,负责用户界面的设计与开发。

35 |
36 |
37 |
38 |
39 |
40 | 团队成员3 41 |
42 |
王五
43 |

后端开发,负责数据库和服务端的开发与优化。

44 |
45 |
46 |
47 |
48 |
49 | 50 | 51 |
52 |

联系我们

53 |

如果你有任何问题或建议,欢迎通过以下方式联系我们:

54 |
    55 |
  • 电子邮件:2942581284@qq.com
  • 56 |
  • 官方B站账号:@Python斗罗
  • 57 | {#
  • 客服热线:400-123-4567
  • #} 58 |
59 |
60 |
61 | {% endblock %} 62 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/category.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/sandbox/news/news_base.html" %} 2 | {% load static %} 3 | {% block title %}新闻来源与类别{% endblock %} 4 | {% block content %} 5 |
6 |
7 | 8 |
9 |
10 |
11 |

新闻来源

12 |
13 |
14 | 23 |
24 |
25 |
26 | 27 | 28 |
29 |
30 |
31 |

新闻类别

32 |
33 |
34 | 45 |
46 |
47 |
48 |
49 |
50 | {% endblock %} 51 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/detail_category.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/sandbox/news/news_base.html" %} 2 | {% block title %}{{ category.name }} 详情{% endblock %} 3 | {% block content %} 4 |
5 |

{{ category.name }}

6 |

{{ category.description }}

7 |
8 | {% endblock %} 9 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/detail_news.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/sandbox/news/news_base.html" %} 2 | {% block content %} 3 |
4 |

{{ news_item.title }}

5 |

{{ news_item.content }}

6 | 返回首页 7 |
8 | {% endblock %} 9 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/detail_source.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/sandbox/news/news_base.html" %} 2 | {% block title %}{{ source.name }} 详情{% endblock %} 3 | {% block content %} 4 |
5 |

{{ source.name }}

6 |

{{ source.description }}

7 |
8 | {% endblock %} 9 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/news_base.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %}星梦新闻{% endblock %} 4 | {% block header %} 5 | {% include "topics/sandbox/news/news_header.html" %} 6 | 7 | {% endblock %} 8 | {% block answer %} 9 | 10 | {% endblock %} 11 | {% block content %} 12 | {# 每个页面的内容#} 13 | {% endblock %} 14 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/news_header.html: -------------------------------------------------------------------------------- 1 | {% load static %} 2 | 3 | 4 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/news_hot.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/sandbox/news/news_base.html" %} 2 | 3 | {% block title %}热榜{% endblock %} 4 | 5 | {% block content %} 6 |
7 |
8 | {% for platform, news_list in platform_news_mapping.items %} 9 |
10 |
11 |
12 |
{{ platform.name }}
13 | 查看更多 15 |
16 |
17 | {% if news_list %} 18 |
    19 | {% for news in news_list %} 20 |
  • 21 | 22 |
    23 | 26 | {#{% if forloop.counter == 1 %}bg-warning text-white{% elif forloop.counter == 2 %}bg-secondary text-white{% elif forloop.counter == 3 %}bg-success text-white{% else %}bg-secondary text-white{% endif %}">#} 27 | {{ forloop.counter }} 28 | 29 | 31 | {{ news.title }} 33 | 34 |
    35 |
  • 36 | {% endfor %} 37 |
38 | {% else %} 39 |

暂无新闻

40 | {% endif %} 41 |
42 |
43 |
44 | {% endfor %} 45 |
46 |
47 | 48 | 49 | 55 | 56 | {% endblock %} 57 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/news_hot_detail.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/sandbox/news/news_base.html" %} 2 | 3 | {% block title %}热榜{% endblock %} 4 | 5 | {% block content %} 6 |
7 |

平台热榜

8 | 9 | 10 |
11 |
12 |
13 | {% for platform in platforms %} 14 | 21 | {% endfor %} 22 |
23 |
24 |
25 | 26 | {% if selected_platform %} 27 |
28 | 29 |
30 |
31 |
32 |

{{ selected_platform.name }} 热榜

33 |
34 |
35 | 36 |
37 | {% for news in news_lst %} 38 |
39 |
40 | 41 |
42 | #} 45 | {% if forloop.counter == 1 %}bg-warning text-white{% elif forloop.counter == 2 %}bg-secondary text-white{% elif forloop.counter == 3 %}bg-success text-white{% else %}bg-light text-dark{% endif %}"> 46 | 47 | {{ forloop.counter }} 48 | 49 |
50 | 61 |
62 |
63 | {% empty %} 64 |
65 |

该平台暂无热榜新闻。

66 |
67 | {% endfor %} 68 |
69 |
70 |
71 |
72 |
73 | {% else %} 74 |
75 |

请选择一个平台来查看热榜。

76 |
77 | {% endif %} 78 |
79 | {% endblock %} 80 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/news_index.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/sandbox/news/news_base.html" %} 2 | {% load static %} 3 | {% block content %} 4 |
5 | 6 |
7 | 星梦新闻 Logo 9 |

星梦新闻

10 |
11 | 12 | 13 | 22 | 23 | 24 |
25 |

最新热点新闻

26 |
27 | {% for news_item in latest_news %} 28 |
29 |
30 |
31 |
32 | {{ news_item.title }} 34 |
35 |

{{ news_item.summary }}

36 | {{ news_item.publish_date }} 37 |
38 |
39 |
40 | {% endfor %} 41 |
42 |
43 |
44 | {% endblock %} 45 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/notice.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/sandbox/news/news_base.html" %} 2 | {% load static %} 3 | {% block content %} 4 |
5 |

推送通知设置

6 | 7 | 8 |
9 |

是否接收通知

10 |
11 | 12 | 15 |
16 |
17 | 18 | 19 |
20 |

选择您感兴趣的新闻类型

21 |
22 | 23 | 26 |
27 |
28 | 29 | 32 |
33 |
34 | 35 | 38 |
39 |
40 | 41 | 44 |
45 |
46 | 47 | 48 |
49 |

选择订阅套餐

50 |
51 | 52 | 57 |
58 |
59 | 60 | 61 |
62 | 63 |
64 |
65 | 66 | {% endblock %} 67 | -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/technology.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/topics/templates/topics/sandbox/news/technology.html -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/news/web3.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/topics/templates/topics/sandbox/news/web3.html -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/wallpaper/wallpaper.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/topics/templates/topics/sandbox/wallpaper/wallpaper.html -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/wallpaper/wallpaper_base.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/topics/templates/topics/sandbox/wallpaper/wallpaper_base.html -------------------------------------------------------------------------------- /topics/templates/topics/sandbox/wallpaper/wallpaper_header.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/topics/templates/topics/sandbox/wallpaper/wallpaper_header.html -------------------------------------------------------------------------------- 
/topics/templates/topics/solutions.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {% load static %} 3 | {% block title %}题解{% endblock %} 4 | 5 | {% block answer %} 6 | {% endblock %} 7 | 8 | {% block content %} 9 |
10 | ... 11 |
12 | 题解 13 |
14 |
15 | {% endblock %} -------------------------------------------------------------------------------- /topics/templates/topics/tools/encode.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/cpython666/LearnSpider/c86901bb0e6066fe9f60030c861b24828d35e0f7/topics/templates/topics/tools/encode.html -------------------------------------------------------------------------------- /topics/templates/topics/views/encode.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | {#{% block charset %} {% endblock %}#} 3 | {#{% block charset %} {% endblock %}#} 4 | {#{% block charset %} {% endblock %}#} 5 | {% block title %} 6 | 网页编码 7 | {% endblock %} 8 | {% block question %} 9 |

您好🦆, 爬虫er~👋

10 |

11 | 尝试用requests请求这个页面,查看结果是否有什么不一样呢?
12 | 尝试解决它!【可以看教程的奥】
13 | 请回答:【解决了】 14 |

15 | {% endblock %} 16 | 17 | {% block content %} 18 |

有的网页编码是gbk,有的是utf-8,也有的是一些变种比如ISO-8859-1等等。当你的解码方法与网页的编码方法不同的时候,就会产生乱码。所以,如何判断知道网页的编码呢?

19 | {% endblock %} 20 | -------------------------------------------------------------------------------- /topics/templates/topics/views/hello-spider.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | 4 | {% block title %} 5 | Hello,爬虫! 6 | {% endblock %} 7 | {% block question %} 8 |

您好🦆, 爬虫er~👋

9 |

10 | 请问,这个页面有多少个:《Hello, Spider~》?【ps:题目中的这个不算!】 11 | 12 |

13 | {% endblock %} 14 | 15 | {% block content %} 16 | {% for greeting, button_class in greeting_buttons %} 17 | 18 | {% endfor %} 19 | {% endblock %} 20 | -------------------------------------------------------------------------------- /topics/templates/topics/views/request-twice-cookie.html: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | Request-Twice 7 | 8 | 9 | 10 | 19 | 20 | 21 | -------------------------------------------------------------------------------- /topics/templates/topics/views/request-twice.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | 4 | {% block title %} 5 | cookie反爬-pro 6 | {% endblock %} 7 | {% block question %} 8 |

您好🦆, 爬虫er~👋

9 |

10 | 请问,你用代码获取到这个页面的源代码了吗? 11 |

12 | {% endblock %} 13 | 14 | {% block content %} 15 | {% for greeting, button_class in greeting_buttons %} 16 | 17 | {% endfor %} 18 | {% endblock %} 19 | -------------------------------------------------------------------------------- /topics/templates/topics/views/table.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | 表格求和 5 | {% endblock %} 6 | {% block question %} 7 |

您好🦆, 爬虫er~👋

8 |

9 | 请问,表格中所有数字的总和为多少?【ctrl+f搜不到了吧,哈哈😂】 10 | 11 |

12 | {% endblock %} 13 | 14 | {% block content %} 15 | 16 |
17 |

表格求和

18 | 19 | 20 | 21 | {% for col in table_data.0 %} 22 | 23 | {% endfor %} 24 | 25 | 26 | 27 | {% for row in table_data %} 28 | 29 | {% for cell in row %} 30 | 31 | {% endfor %} 32 | 33 | {% endfor %} 34 | 35 |
列{{ forloop.counter }}
{{ cell }}
36 |
37 | {% endblock %} 38 | -------------------------------------------------------------------------------- /topics/templates/topics/views/ua.html: -------------------------------------------------------------------------------- 1 | {% extends "topics/base.html" %} 2 | 3 | {% block title %} 4 | UA检测 5 | {% endblock %} 6 | 7 | {% block question %} 8 |

您好🦆, 爬虫er~👋

9 |

10 | 请问,你用代码获取到这个页面的源代码了吗?[老实点🥸]
11 | 请回答:【获取到了】 12 |

13 | {% endblock %} 14 | 15 | {% block content %} 16 |

小新第一次请求之后成功获取了网页的源代码,虽然不知道网络的各种原理,但是还是很有成就感的,只是...这就是爬虫吗,就这么简单?尝试下这个网页吧!

17 | {% endblock %} 18 | -------------------------------------------------------------------------------- /topics/tests.py: -------------------------------------------------------------------------------- 1 | from django.test import TestCase 2 | 3 | # Create your tests here. 4 | -------------------------------------------------------------------------------- /topics/urls.py: -------------------------------------------------------------------------------- 1 | from django.urls import path 2 | from . import views 3 | from django.urls import path 4 | from .views import topic_view 5 | 6 | urlpatterns = [ 7 | path("", views.index, name="index"), 8 | path("list", views.list, name="list"), 9 | path("tools", views.tools, name="tools"), 10 | path("shorthand", views.shorthand, name="shorthand"), 11 | path("solutions", views.solutions, name="solutions"), 12 | # ------------------ 试金场 ----------------- 13 | path("sandbox/", views.sandbox, name="sandbox"), 14 | path("sandbox/news/", views.sandbox_news, name="sandbox_news"), 15 | path("sandbox/news/search/", views.sandbox_news, name="sandbox_news_search"), 16 | path( 17 | "sandbox/news/about/", views.sandbox_news_about_us, name="sandbox_news_about_us" 18 | ), # 关于我们页面 19 | path("sandbox/news/notice/", views.sandbox_news_notice, name="sandbox_news_notice"), 20 | path( 21 | "sandbox/news/category/", 22 | views.sandbox_news_category, 23 | name="sandbox_news_category", 24 | ), 25 | path( 26 | "sandbox/news/category//", 27 | views.sandbox_news_category_detail, 28 | name="sandbox_news_category_detail", 29 | ), 30 | # 详情页面路由 31 | path( 32 | "sandbox/news/source//", 33 | views.sandbox_news_source_detail, 34 | name="sandbox_news_source_detail", 35 | ), 36 | # path('news/category//', views.category_detail, name='category_detail'), 37 | path("sandbox/news/hot/", views.sandbox_news_hot, name="sandbox_news_hot"), 38 | path( 39 | "sandbox/news/hot//", 40 | views.sandbox_news_hot_detail, 41 | name="sandbox_news_hot_detail", 42 | ), 43 | 
path("sandbox/news/category/technology/", views.sandbox_news, name="sandbox_news"), 44 | path("sandbox/news/category/web3/", views.sandbox_news, name="sandbox_news"), 45 | path( 46 | "sandbox/news/news_detail//", 47 | views.sandbox_news_detail, 48 | name="sandbox_news_detail", 49 | ), 50 | # ------------------------------------------ 51 | # topic开头 重定向到视图返回 /html pages静态页面类型 52 | path("page//", topic_view, name="topic_view"), 53 | # ------------------------------------------ 54 | # 请求视图类型 55 | path("view/hello-spider/", views.hello_spider, name="request_twice"), 56 | path("view/request-twice/", views.request_twice, name="request-twice"), 57 | path("view/ua/", views.ua, name="ua"), 58 | path("view/encode/", views.encode_page, name="encode"), 59 | path("view/table/", views.table, name="table"), 60 | # 混合请求接口类型 61 | path("demo/", views.demo), 62 | path("demo1/", views.demo1), 63 | ] 64 | -------------------------------------------------------------------------------- /topics/views.py: -------------------------------------------------------------------------------- 1 | from django.shortcuts import get_object_or_404 2 | from datetime import datetime 3 | from .models import Topics, NewsPlatform, News, NewsCategory, NewsRequestHistory 4 | from .decorators import require_ua 5 | import time 6 | import random 7 | from django.shortcuts import render 8 | 9 | 10 | def demo(request): 11 | return render(request, "topics/pages/demo_get_server_time.html") 12 | 13 | 14 | def demo1(request): 15 | return render(request, "topics/pages/demo.html") 16 | 17 | 18 | def hello_spider(request): # random_greetings 19 | greetings = [] 20 | button_classes = [ 21 | "btn btn-primary", 22 | "btn btn-secondary", 23 | "btn btn-success", 24 | "btn btn-danger", 25 | "btn btn-warning", 26 | "btn btn-info", 27 | "btn btn-light", 28 | "btn btn-dark", 29 | "btn btn-link", 30 | ] 31 | # 随机生成 666 个 "Hello, Spider~" 32 | for _ in range(666): 33 | greetings.append("Hello, Spider~") 34 | # 随机生成 "你好~世界!" 
的数量(例如,随机 1 到 100 个) 35 | nihao_count = random.randint(1, 100) 36 | for _ in range(nihao_count): 37 | greetings.append("你好~世界!") 38 | # 随机生成 "Hello, World~" 的数量(例如,随机 1 到 100 个) 39 | hello_world_count = random.randint(1, 100) 40 | for _ in range(hello_world_count): 41 | greetings.append("Hello, World~") 42 | # 为每个 greeting 随机选择一个按钮样式 43 | greeting_buttons = [ 44 | (greeting, random.choice(button_classes)) for greeting in greetings 45 | ] 46 | # 打乱顺序 47 | random.shuffle(greeting_buttons) 48 | 49 | return render( 50 | request, 51 | "topics/views/hello-spider.html", 52 | {"greeting_buttons": greeting_buttons}, 53 | ) 54 | 55 | 56 | @require_ua 57 | def ua(request): 58 | return render(request, "topics/views/ua.html") 59 | 60 | 61 | def encode_page(request): 62 | response = render(request, "topics/views/encode.html") 63 | response["Content-Type"] = "text/html;" 64 | # response['Content-Type'] = 'text/html; charset=GB2312' 65 | # response['Content-Type'] = 'text/html;UTF-8' 66 | # response['Content-Type'] = 'text/html; charset=ISO-8859-1' 67 | return response 68 | 69 | 70 | def table(request): 71 | # 定义行数和列数,这里可以随机生成,或者根据你的需求来确定 72 | rows = random.randint(5, 10) 73 | cols = random.randint(5, 10) 74 | 75 | # 生成随机的表格数据,确保总和为666666 76 | total_sum = 666666 77 | table_data = [[0] * cols for _ in range(rows)] 78 | remaining_sum = total_sum 79 | 80 | for r in range(rows): 81 | for c in range(cols): 82 | if r == rows - 1 and c == cols - 1: 83 | table_data[r][c] = remaining_sum # 最后一个单元格填充剩余的数值 84 | else: 85 | # 确保 max_value 始终大于等于 1 86 | max_value = max(1, remaining_sum - (rows - r - 1) * (cols - c - 1)) 87 | value = random.randint(1, max_value) 88 | table_data[r][c] = value 89 | remaining_sum -= value 90 | 91 | context = {"table_data": table_data} 92 | return render(request, "topics/views/table.html", context) 93 | 94 | 95 | def request_twice(request): 96 | # get_content_or_script 97 | # 设定 Cookie 的过期时间为一秒 98 | # 考虑到以下几点,仍然进行过期时间的判断是一个更健壮的设计: 99 | # 浏览器行为不一致: 
不同浏览器可能在处理过期Cookie时有不同的行为,有些可能不会立即删除。 100 | # 用户行为不确定: 用户可能会手动修改浏览器时间,或者在极端情况下,浏览器可能不会及时删除过期的Cookie。 101 | # 潜在的安全问题: 不信任客户端数据的完整性始终是一个好的安全实践。 102 | # 因此,尽管浏览器应该删除过期的Cookie,后端进行过期时间的验证仍然是推荐的做法,以确保系统的可靠性和安全性。 103 | COOKIE_NAME = "timestamp" 104 | COOKIE_EXPIRATION = 1 # 秒 105 | # 读取 Cookie 106 | cookie_value = request.COOKIES.get(COOKIE_NAME) 107 | if cookie_value: 108 | try: 109 | # 验证 Cookie 是否过期 110 | cookie_timestamp = float(cookie_value) 111 | current_time = time.time() 112 | if current_time - cookie_timestamp <= COOKIE_EXPIRATION: 113 | # 如果 Cookie 仍然有效,返回 HTML 内容 114 | return render(request, "topics/views/request-twice.html") 115 | except ValueError: 116 | pass 117 | # 如果没有有效的 Cookie,返回 JavaScript 代码来设置 Cookie 118 | return render(request, "topics/views/request-twice-cookie.html") 119 | 120 | 121 | def index(request): 122 | return render(request, "topics/index/index.html") 123 | 124 | 125 | def list(request): 126 | return render(request, "topics/index/list.html") 127 | 128 | 129 | def tools(request): 130 | return render(request, "topics/index/tools.html") 131 | 132 | 133 | def sandbox(request): 134 | return render(request, "topics/index/sandbox.html") 135 | 136 | 137 | def sandbox_news(request): 138 | # 模拟一些假新闻数据 139 | latest_news = [ 140 | { 141 | "id": 1, 142 | "title": "新科技革命:AI 将重塑未来", 143 | "summary": "随着 AI 技术的飞速发展,未来的科技将发生翻天覆地的变化...", 144 | "publish_date": datetime.now().strftime("%Y-%m-%d"), 145 | }, 146 | { 147 | "id": 2, 148 | "title": "2025年全球互联网将迎来新变革", 149 | "summary": "在未来几年,全球互联网将经历一场前所未有的革命...", 150 | "publish_date": datetime.now().strftime("%Y-%m-%d"), 151 | }, 152 | { 153 | "id": 3, 154 | "title": "量子计算的突破性进展", 155 | "summary": "量子计算作为一种新型计算模式,正在逐步突破技术瓶颈...", 156 | "publish_date": datetime.now().strftime("%Y-%m-%d"), 157 | }, 158 | { 159 | "id": 4, 160 | "title": "5G网络加速全球数字化进程", 161 | "summary": "5G网络的普及正在改变全球通信格局,推动各行各业的数字化转型...", 162 | "publish_date": datetime.now().strftime("%Y-%m-%d"), 163 | }, 164 | { 165 | "id": 5, 166 | "title": 
"未来科技:机器人将进入家庭生活", 167 | "summary": "随着人工智能和机器人技术的发展,智能机器人正在进入普通家庭...", 168 | "publish_date": datetime.now().strftime("%Y-%m-%d"), 169 | }, 170 | ] 171 | 172 | return render( 173 | request, 174 | "topics/sandbox/news/news_index.html", 175 | {"latest_news": latest_news, "search": "/sandbox/news/search"}, 176 | ) 177 | 178 | 179 | # 模拟分类和新闻数据 180 | categories = [ 181 | { 182 | "id": 1, 183 | "char_name": "technology", 184 | "name": "科技", 185 | "news": [ 186 | { 187 | "id": 1, 188 | "title": "AI 的未来", 189 | "summary": "探索人工智能的最新发展...", 190 | "publish_date": "2025-02-13", 191 | }, 192 | { 193 | "id": 2, 194 | "title": "5G 网络的全球影响", 195 | "summary": "5G 网络带来的技术革新...", 196 | "publish_date": "2025-02-12", 197 | }, 198 | ], 199 | }, 200 | { 201 | "id": 2, 202 | "char_name": "happy", 203 | "name": "娱乐", 204 | "news": [ 205 | { 206 | "id": 3, 207 | "title": "明星动态:新电影发布", 208 | "summary": "最新电影上映,明星动态...", 209 | "publish_date": "2025-02-14", 210 | }, 211 | { 212 | "id": 4, 213 | "title": "2025年超级碗回顾", 214 | "summary": "今年超级碗的精彩瞬间...", 215 | "publish_date": "2025-02-10", 216 | }, 217 | ], 218 | }, 219 | { 220 | "id": 3, 221 | "char_name": "sport", 222 | "name": "体育", 223 | "news": [ 224 | { 225 | "id": 5, 226 | "title": "足球世界杯的传奇时刻", 227 | "summary": "回顾世界杯历史上的经典时刻...", 228 | "publish_date": "2025-02-11", 229 | }, 230 | { 231 | "id": 6, 232 | "title": "NBA 历史最佳球员排名", 233 | "summary": "NBA 球员排名持续更新...", 234 | "publish_date": "2025-02-09", 235 | }, 236 | ], 237 | }, 238 | { 239 | "id": 4, 240 | "char_name": "web3", 241 | "name": "Web3", 242 | "news": [ 243 | { 244 | "id": 7, 245 | "title": "Web3:去中心化互联网的崛起", 246 | "summary": "Web3 作为去中心化的互联网理念,正在改变许多行业...", 247 | "publish_date": "2025-02-15", 248 | }, 249 | { 250 | "id": 8, 251 | "title": "NFT 的未来:如何定义数字所有权", 252 | "summary": "NFT 已成为区块链中的一个重要领域,它带来了数字资产的革命...", 253 | "publish_date": "2025-02-14", 254 | }, 255 | { 256 | "id": 9, 257 | "title": "DeFi:去中心化金融的现状与未来", 258 | "summary": "DeFi 带来了无银行的金融模式,它能否挑战传统金融体系?", 259 | 
"publish_date": "2025-02-13", 260 | }, 261 | ], 262 | }, 263 | ] 264 | 265 | 266 | def sandbox_news_category(request): 267 | # 模拟数据:新闻来源平台和新闻类别 268 | sources = [ 269 | {"name": "抖音", "slug": "douyin"}, 270 | {"name": "B站", "slug": "bilibili"}, 271 | {"name": "知乎", "slug": "zhihu"}, 272 | ] 273 | # 模拟数据:新闻类别 274 | categories = [ 275 | {"name": "国际新闻", "slug": "international"}, 276 | {"name": "国内新闻", "slug": "domestic"}, 277 | {"name": "科技新闻", "slug": "technology"}, 278 | {"name": "体育新闻", "slug": "sports"}, 279 | {"name": "娱乐新闻", "slug": "entertainment"}, 280 | ] 281 | 282 | # 将数据传递到模板 283 | return render( 284 | request, 285 | "topics/sandbox/news/category.html", 286 | {"sources": sources, "categories": categories}, 287 | ) 288 | 289 | 290 | def sandbox_news_category_detail(request, slug): 291 | # 模拟数据:新闻类别详情 292 | categories_details = { 293 | "international": { 294 | "name": "国际新闻", 295 | "description": "全球范围内的新闻热点,聚焦国际局势。", 296 | }, 297 | "domestic": { 298 | "name": "国内新闻", 299 | "description": "关注本国的时事新闻,涵盖社会、政治、经济等各个方面。", 300 | }, 301 | "technology": { 302 | "name": "科技新闻", 303 | "description": "报道最新的科技趋势、创新产品和技术突破。", 304 | }, 305 | "sports": { 306 | "name": "体育新闻", 307 | "description": "关注体育赛事、运动员动态及全球体育新闻。", 308 | }, 309 | "entertainment": { 310 | "name": "娱乐新闻", 311 | "description": "报道娱乐圈的最新动态、明星资讯、影视作品等。", 312 | }, 313 | } 314 | 315 | category = categories_details.get(slug, {}) 316 | return render( 317 | request, "topics/sandbox/news/detail_category.html", {"category": category} 318 | ) 319 | 320 | 321 | def sandbox_news_source_detail(request, slug): 322 | # 模拟数据:来源平台详情 323 | sources_details = { 324 | "douyin": { 325 | "name": "抖音", 326 | "description": "抖音是一款短视频分享社交平台,用户可以发布和观看短视频。", 327 | }, 328 | "bilibili": { 329 | "name": "B站", 330 | "description": "B站是一家以二次元文化为主的在线视频平台,提供丰富的视频内容。", 331 | }, 332 | "zhihu": { 333 | "name": "知乎", 334 | "description": "知乎是一个知识分享和问答社区,汇集了大量专业内容和用户互动。", 335 | }, 336 | } 337 | 338 | source = sources_details.get(slug, {}) 339 
| print(source) 340 | return render(request, "topics/sandbox/news/detail_source.html", {"source": source}) 341 | 342 | 343 | def sandbox_news_hot(request): 344 | platforms = NewsPlatform.objects.all() 345 | # 第一次查询,获取所有数据行的 id 和 platform_id 346 | res = {} 347 | first_query_results = NewsRequestHistory.objects.order_by("-id").values( 348 | "id", "platform_id" 349 | )[: 2 * len(platforms)] 350 | for _ in first_query_results[::-1]: 351 | res[_["platform_id"]] = _["id"] 352 | # 使用 ids 查询真实数据 353 | latest_records = NewsRequestHistory.objects.filter(id__in=res.values()) 354 | id_news_mapping = {} 355 | # 将日志对象映射到新闻数据 356 | for log_obj in latest_records: 357 | id_news_mapping[log_obj.platform_id] = log_obj.response_data[:10] 358 | # 为每个平台添加新闻数据 359 | platform_news_mapping = {} 360 | for platform in platforms: 361 | platform_news_mapping[platform] = id_news_mapping.get(platform.id, []) 362 | # 将平台及其对应的新闻传递给模板 363 | return render( 364 | request, 365 | "topics/sandbox/news/news_hot.html", 366 | { 367 | "platform_news_mapping": platform_news_mapping, 368 | }, 369 | ) 370 | 371 | 372 | def sandbox_news_hot_detail(request, slug): 373 | platforms = NewsPlatform.objects.all() 374 | news = None 375 | if slug: 376 | selected_platform = NewsPlatform.objects.get(slug=slug) 377 | log_obj = ( 378 | NewsRequestHistory.objects.filter(platform_id=selected_platform.id) 379 | .order_by("-id") 380 | .first() 381 | ) 382 | news = log_obj.response_data 383 | else: 384 | selected_platform = None 385 | 386 | return render( 387 | request, 388 | "topics/sandbox/news/news_hot_detail.html", 389 | { 390 | "platforms": platforms, 391 | "selected_platform": selected_platform, 392 | "news_lst": news, 393 | }, 394 | ) 395 | 396 | 397 | def hot_news_detail_view(request, id): 398 | ... 
399 | # news = get_object_or_404(HotNews, id=id) 400 | # return render(request, 'hot_news_detail.html', {'news': news}) 401 | 402 | 403 | def sandbox_news_detail(request, id): 404 | # 假设根据id获取新闻,实际上只是返回假数据 405 | news_item = { 406 | "id": id, 407 | "title": f"新闻 {id} 详情", 408 | "content": "这是新闻的详细内容,更多的细节信息可以在这里展示。", 409 | } 410 | return render( 411 | request, "topics/sandbox/news/detail_news.html", {"news_item": news_item} 412 | ) 413 | 414 | 415 | def sandbox_news_about_us(request): 416 | return render(request, "topics/sandbox/news/about_us.html") 417 | 418 | 419 | def sandbox_news_notice(request): 420 | return render(request, "topics/sandbox/news/notice.html") 421 | 422 | 423 | def shorthand(request): 424 | return render(request, "topics/index/shorthand.html") 425 | 426 | 427 | def solutions(request): 428 | return render(request, "topics/solutions.html") 429 | 430 | 431 | def topic_view(request, response_path): 432 | # 根据 path 获取对应的题目 433 | topic = get_object_or_404(Topics, response_path=response_path) 434 | # 返回对应的 HTML 视图 435 | return render(request, "topics/pages/" + response_path + ".html", {"topic": topic}) 436 | 437 | 438 | def error404(request, exception): 439 | return render(request, "topics/404.html", status=404) 440 | --------------------------------------------------------------------------------