DjangoPeng commited on
Commit
3851ff8
·
1 Parent(s): e5c7047

add GitHubSentinel v0.8.2

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. Dockerfile +24 -0
  2. LICENSE +201 -0
  3. README-EN.md +318 -0
  4. README.md +307 -1
  5. build_image.sh +16 -0
  6. config.json +29 -0
  7. daemon_control.sh +75 -0
  8. daily_progress/langchain-ai_langchain/.ipynb_checkpoints/2024-08-18-checkpoint.md +36 -0
  9. docs/ollama.md +195 -0
  10. docs/unit_test.md +169 -0
  11. images/build_docker_image.jpg +0 -0
  12. images/gradio_demo.png +0 -0
  13. images/gradio_v0.8_github.png +0 -0
  14. images/gradio_v0.8_hn.png +0 -0
  15. logs/DaemonProcess.log +0 -0
  16. logs/app.2024-09-20_10-00-00_575591.log +0 -0
  17. logs/app.log +0 -0
  18. prompts/github_ollama_prompt.txt +23 -0
  19. prompts/github_openai_prompt.txt +22 -0
  20. prompts/hacker_news_daily_report_ollama_prompt.txt +37 -0
  21. prompts/hacker_news_daily_report_openai_prompt.txt +35 -0
  22. prompts/hacker_news_hours_topic_ollama_prompt.txt +24 -0
  23. prompts/hacker_news_hours_topic_openai_prompt.txt +24 -0
  24. requirements.txt +6 -0
  25. src/__pycache__/cli.cpython-311.pyc +0 -0
  26. src/__pycache__/command_handler.cpython-310.pyc +0 -0
  27. src/__pycache__/config.cpython-310.pyc +0 -0
  28. src/__pycache__/config.cpython-311.pyc +0 -0
  29. src/__pycache__/config.cpython-312.pyc +0 -0
  30. src/__pycache__/email_notifier.cpython-311.pyc +0 -0
  31. src/__pycache__/github_client.cpython-310.pyc +0 -0
  32. src/__pycache__/github_client.cpython-311.pyc +0 -0
  33. src/__pycache__/github_client.cpython-312.pyc +0 -0
  34. src/__pycache__/hacker_news_client.cpython-310.pyc +0 -0
  35. src/__pycache__/llm.cpython-310.pyc +0 -0
  36. src/__pycache__/logger.cpython-310.pyc +0 -0
  37. src/__pycache__/logger.cpython-312.pyc +0 -0
  38. src/__pycache__/notifier.cpython-310.pyc +0 -0
  39. src/__pycache__/notifier.cpython-311.pyc +0 -0
  40. src/__pycache__/report_generator.cpython-310.pyc +0 -0
  41. src/__pycache__/report_generator.cpython-311.pyc +0 -0
  42. src/__pycache__/scheduler.cpython-310.pyc +0 -0
  43. src/__pycache__/scheduler.cpython-311.pyc +0 -0
  44. src/__pycache__/scheduler.cpython-312.pyc +0 -0
  45. src/__pycache__/subscription_manager.cpython-310.pyc +0 -0
  46. src/__pycache__/subscription_manager.cpython-311.pyc +0 -0
  47. src/command_handler.py +85 -0
  48. src/command_tool.py +38 -0
  49. src/config.py +34 -0
  50. src/daemon_process.py +94 -0
Dockerfile ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Dockerfile
2
+
3
+ # 使用官方的 Python 基础镜像
4
+ FROM python:3.10-slim
5
+
6
+ # 设置工作目录
7
+ WORKDIR /app
8
+
9
+ # 复制 requirements.txt 并安装依赖
10
+ COPY requirements.txt .
11
+
12
+ # 安装 Python 依赖
13
+ RUN pip install --no-cache-dir -r requirements.txt
14
+
15
+ # 复制项目的所有文件到容器
16
+ COPY . .
17
+
18
+ # 复制并执行 validate_tests.sh 脚本
19
+ COPY validate_tests.sh .
20
+ RUN chmod +x validate_tests.sh
21
+ RUN ./validate_tests.sh
22
+
23
+ # 设置容器入口
24
+ CMD ["python", "src/daemon_process.py"]
LICENSE ADDED
@@ -0,0 +1,201 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Apache License
2
+ Version 2.0, January 2004
3
+ http://www.apache.org/licenses/
4
+
5
+ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
6
+
7
+ 1. Definitions.
8
+
9
+ "License" shall mean the terms and conditions for use, reproduction,
10
+ and distribution as defined by Sections 1 through 9 of this document.
11
+
12
+ "Licensor" shall mean the copyright owner or entity authorized by
13
+ the copyright owner that is granting the License.
14
+
15
+ "Legal Entity" shall mean the union of the acting entity and all
16
+ other entities that control, are controlled by, or are under common
17
+ control with that entity. For the purposes of this definition,
18
+ "control" means (i) the power, direct or indirect, to cause the
19
+ direction or management of such entity, whether by contract or
20
+ otherwise, or (ii) ownership of fifty percent (50%) or more of the
21
+ outstanding shares, or (iii) beneficial ownership of such entity.
22
+
23
+ "You" (or "Your") shall mean an individual or Legal Entity
24
+ exercising permissions granted by this License.
25
+
26
+ "Source" form shall mean the preferred form for making modifications,
27
+ including but not limited to software source code, documentation
28
+ source, and configuration files.
29
+
30
+ "Object" form shall mean any form resulting from mechanical
31
+ transformation or translation of a Source form, including but
32
+ not limited to compiled object code, generated documentation,
33
+ and conversions to other media types.
34
+
35
+ "Work" shall mean the work of authorship, whether in Source or
36
+ Object form, made available under the License, as indicated by a
37
+ copyright notice that is included in or attached to the work
38
+ (an example is provided in the Appendix below).
39
+
40
+ "Derivative Works" shall mean any work, whether in Source or Object
41
+ form, that is based on (or derived from) the Work and for which the
42
+ editorial revisions, annotations, elaborations, or other modifications
43
+ represent, as a whole, an original work of authorship. For the purposes
44
+ of this License, Derivative Works shall not include works that remain
45
+ separable from, or merely link (or bind by name) to the interfaces of,
46
+ the Work and Derivative Works thereof.
47
+
48
+ "Contribution" shall mean any work of authorship, including
49
+ the original version of the Work and any modifications or additions
50
+ to that Work or Derivative Works thereof, that is intentionally
51
+ submitted to Licensor for inclusion in the Work by the copyright owner
52
+ or by an individual or Legal Entity authorized to submit on behalf of
53
+ the copyright owner. For the purposes of this definition, "submitted"
54
+ means any form of electronic, verbal, or written communication sent
55
+ to the Licensor or its representatives, including but not limited to
56
+ communication on electronic mailing lists, source code control systems,
57
+ and issue tracking systems that are managed by, or on behalf of, the
58
+ Licensor for the purpose of discussing and improving the Work, but
59
+ excluding communication that is conspicuously marked or otherwise
60
+ designated in writing by the copyright owner as "Not a Contribution."
61
+
62
+ "Contributor" shall mean Licensor and any individual or Legal Entity
63
+ on behalf of whom a Contribution has been received by Licensor and
64
+ subsequently incorporated within the Work.
65
+
66
+ 2. Grant of Copyright License. Subject to the terms and conditions of
67
+ this License, each Contributor hereby grants to You a perpetual,
68
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
69
+ copyright license to reproduce, prepare Derivative Works of,
70
+ publicly display, publicly perform, sublicense, and distribute the
71
+ Work and such Derivative Works in Source or Object form.
72
+
73
+ 3. Grant of Patent License. Subject to the terms and conditions of
74
+ this License, each Contributor hereby grants to You a perpetual,
75
+ worldwide, non-exclusive, no-charge, royalty-free, irrevocable
76
+ (except as stated in this section) patent license to make, have made,
77
+ use, offer to sell, sell, import, and otherwise transfer the Work,
78
+ where such license applies only to those patent claims licensable
79
+ by such Contributor that are necessarily infringed by their
80
+ Contribution(s) alone or by combination of their Contribution(s)
81
+ with the Work to which such Contribution(s) was submitted. If You
82
+ institute patent litigation against any entity (including a
83
+ cross-claim or counterclaim in a lawsuit) alleging that the Work
84
+ or a Contribution incorporated within the Work constitutes direct
85
+ or contributory patent infringement, then any patent licenses
86
+ granted to You under this License for that Work shall terminate
87
+ as of the date such litigation is filed.
88
+
89
+ 4. Redistribution. You may reproduce and distribute copies of the
90
+ Work or Derivative Works thereof in any medium, with or without
91
+ modifications, and in Source or Object form, provided that You
92
+ meet the following conditions:
93
+
94
+ (a) You must give any other recipients of the Work or
95
+ Derivative Works a copy of this License; and
96
+
97
+ (b) You must cause any modified files to carry prominent notices
98
+ stating that You changed the files; and
99
+
100
+ (c) You must retain, in the Source form of any Derivative Works
101
+ that You distribute, all copyright, patent, trademark, and
102
+ attribution notices from the Source form of the Work,
103
+ excluding those notices that do not pertain to any part of
104
+ the Derivative Works; and
105
+
106
+ (d) If the Work includes a "NOTICE" text file as part of its
107
+ distribution, then any Derivative Works that You distribute must
108
+ include a readable copy of the attribution notices contained
109
+ within such NOTICE file, excluding those notices that do not
110
+ pertain to any part of the Derivative Works, in at least one
111
+ of the following places: within a NOTICE text file distributed
112
+ as part of the Derivative Works; within the Source form or
113
+ documentation, if provided along with the Derivative Works; or,
114
+ within a display generated by the Derivative Works, if and
115
+ wherever such third-party notices normally appear. The contents
116
+ of the NOTICE file are for informational purposes only and
117
+ do not modify the License. You may add Your own attribution
118
+ notices within Derivative Works that You distribute, alongside
119
+ or as an addendum to the NOTICE text from the Work, provided
120
+ that such additional attribution notices cannot be construed
121
+ as modifying the License.
122
+
123
+ You may add Your own copyright statement to Your modifications and
124
+ may provide additional or different license terms and conditions
125
+ for use, reproduction, or distribution of Your modifications, or
126
+ for any such Derivative Works as a whole, provided Your use,
127
+ reproduction, and distribution of the Work otherwise complies with
128
+ the conditions stated in this License.
129
+
130
+ 5. Submission of Contributions. Unless You explicitly state otherwise,
131
+ any Contribution intentionally submitted for inclusion in the Work
132
+ by You to the Licensor shall be under the terms and conditions of
133
+ this License, without any additional terms or conditions.
134
+ Notwithstanding the above, nothing herein shall supersede or modify
135
+ the terms of any separate license agreement you may have executed
136
+ with Licensor regarding such Contributions.
137
+
138
+ 6. Trademarks. This License does not grant permission to use the trade
139
+ names, trademarks, service marks, or product names of the Licensor,
140
+ except as required for reasonable and customary use in describing the
141
+ origin of the Work and reproducing the content of the NOTICE file.
142
+
143
+ 7. Disclaimer of Warranty. Unless required by applicable law or
144
+ agreed to in writing, Licensor provides the Work (and each
145
+ Contributor provides its Contributions) on an "AS IS" BASIS,
146
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
147
+ implied, including, without limitation, any warranties or conditions
148
+ of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
149
+ PARTICULAR PURPOSE. You are solely responsible for determining the
150
+ appropriateness of using or redistributing the Work and assume any
151
+ risks associated with Your exercise of permissions under this License.
152
+
153
+ 8. Limitation of Liability. In no event and under no legal theory,
154
+ whether in tort (including negligence), contract, or otherwise,
155
+ unless required by applicable law (such as deliberate and grossly
156
+ negligent acts) or agreed to in writing, shall any Contributor be
157
+ liable to You for damages, including any direct, indirect, special,
158
+ incidental, or consequential damages of any character arising as a
159
+ result of this License or out of the use or inability to use the
160
+ Work (including but not limited to damages for loss of goodwill,
161
+ work stoppage, computer failure or malfunction, or any and all
162
+ other commercial damages or losses), even if such Contributor
163
+ has been advised of the possibility of such damages.
164
+
165
+ 9. Accepting Warranty or Additional Liability. While redistributing
166
+ the Work or Derivative Works thereof, You may choose to offer,
167
+ and charge a fee for, acceptance of support, warranty, indemnity,
168
+ or other liability obligations and/or rights consistent with this
169
+ License. However, in accepting such obligations, You may act only
170
+ on Your own behalf and on Your sole responsibility, not on behalf
171
+ of any other Contributor, and only if You agree to indemnify,
172
+ defend, and hold each Contributor harmless for any liability
173
+ incurred by, or claims asserted against, such Contributor by reason
174
+ of your accepting any such warranty or additional liability.
175
+
176
+ END OF TERMS AND CONDITIONS
177
+
178
+ APPENDIX: How to apply the Apache License to your work.
179
+
180
+ To apply the Apache License to your work, attach the following
181
+ boilerplate notice, with the fields enclosed by brackets "[]"
182
+ replaced with your own identifying information. (Don't include
183
+ the brackets!) The text should be enclosed in the appropriate
184
+ comment syntax for the file format. We also recommend that a
185
+ file or class name and description of purpose be included on the
186
+ same "printed page" as the copyright notice for easier
187
+ identification within third-party archives.
188
+
189
+ Copyright [yyyy] [name of copyright owner]
190
+
191
+ Licensed under the Apache License, Version 2.0 (the "License");
192
+ you may not use this file except in compliance with the License.
193
+ You may obtain a copy of the License at
194
+
195
+ http://www.apache.org/licenses/LICENSE-2.0
196
+
197
+ Unless required by applicable law or agreed to in writing, software
198
+ distributed under the License is distributed on an "AS IS" BASIS,
199
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
200
+ See the License for the specific language governing permissions and
201
+ limitations under the License.
README-EN.md ADDED
@@ -0,0 +1,318 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: GitHubSentinel
3
+ emoji: 👀
4
+ colorFrom: gray
5
+ colorTo: yellow
6
+ sdk: gradio
7
+ sdk_version: 4.42.0
8
+ app_file: app.py
9
+ pinned: false
10
+ license: apache-2.0
11
+ ---
12
+
13
+ # GitHub Sentinel
14
+
15
+ ![GitHub stars](https://img.shields.io/github/stars/DjangoPeng/GitHubSentinel?style=social)
16
+ ![GitHub forks](https://img.shields.io/github/forks/DjangoPeng/GitHubSentinel?style=social)
17
+ ![GitHub watchers](https://img.shields.io/github/watchers/DjangoPeng/GitHubSentinel?style=social)
18
+ ![GitHub repo size](https://img.shields.io/github/repo-size/DjangoPeng/GitHubSentinel)
19
+ ![GitHub language count](https://img.shields.io/github/languages/count/DjangoPeng/GitHubSentinel)
20
+ ![GitHub top language](https://img.shields.io/github/languages/top/DjangoPeng/GitHubSentinel)
21
+ ![GitHub last commit](https://img.shields.io/github/last-commit/DjangoPeng/GitHubSentinel?color=red)
22
+
23
+ <p align="center">
24
+ <br> <a href="README.md">中文</a> | English
25
+ </p>
26
+
27
+ ## Table of Contents
28
+
29
+ - [GitHub Sentinel](#github-sentinel)
30
+ - [Key Features](#key-features)
31
+ - [Product Screenshot](#product-screenshot)
32
+ - [Quick Start](#quick-start)
33
+ - [1. Install Dependencies](#1-install-dependencies)
34
+ - [2. Configure the Application](#2-configure-the-application)
35
+ - [3. How to Run](#3-how-to-run)
36
+ - [A. Run as a Command Line Tool](#a-run-as-a-command-line-tool)
37
+ - [B. Run as a Background Service](#b-run-as-a-background-service)
38
+ - [C. Run as a Gradio Server](#c-run-as-a-gradio-server)
39
+ - [Ollama Installation and Service Deployment](#ollama-installation-and-service-deployment)
40
+ - [Unit Testing](#unit-testing)
41
+ - [Unit Testing and Validation Script `validate_tests.sh`](#unit-testing-and-validation-script-validate_testssh)
42
+ - [Purpose](#purpose)
43
+ - [Functionality](#functionality)
44
+ - [Building and Validating with Docker](#building-and-validating-with-docker)
45
+ - [1. `Dockerfile`](#1-dockerfile)
46
+ - [Purpose](#purpose)
47
+ - [Key Steps](#key-steps)
48
+ - [2. `build_image.sh`](#2-build_imagesh)
49
+ - [Purpose](#purpose)
50
+ - [Functionality](#functionality)
51
+ - [Contributing](#contributing)
52
+ - [License](#license)
53
+ - [Contact](#contact)
54
+
55
+
56
+ GitHub Sentinel is an `AI Agent` designed for the era of large language models (LLMs), specializing in intelligent information retrieval and high-value content extraction. It is tailored for users with high-frequency and large-scale information needs, such as open-source enthusiasts, individual developers, and investors.
57
+
58
+ ### Key Features
59
+
60
+ - **Subscription Management**: Easily manage and track your subscribed GitHub repositories.
61
+ - **Update Retrieval**: Automatically fetch and aggregate the latest updates from your subscribed repositories, including commits, issues, and pull requests.
62
+ - **Notification System**: Receive real-time notifications via email about the latest project progress.
63
+ - **Report Generation**: Generate detailed project progress reports based on the retrieved updates, supporting various formats and templates to meet different needs.
64
+ - **Multi-Model Support**: Leverage OpenAI and Ollama models to generate natural language project reports, offering more intelligent and accurate information services.
65
+ - **Scheduled Tasks**: Supports scheduled tasks running as a daemon process, ensuring timely retrieval of updates.
66
+ - **Graphical Interface**: Provides a simple and user-friendly GUI based on Gradio, making it accessible to a wider audience.
67
+ - **Containerization**: The project supports Docker build and containerized deployment, allowing quick and easy setup in different environments.
68
+ - **Continuous Integration**: Comprehensive unit tests are implemented, facilitating the configuration of production-level CI/CD pipelines to ensure project stability and high-quality delivery.
69
+
70
+ GitHub Sentinel not only helps users automatically track and analyze the progress of `GitHub open-source projects` but also extends its capabilities to other information sources, such as trending topics on `Hacker News`, providing a more comprehensive approach to information extraction and analysis.
71
+
72
+ ### Product Screenshot
73
+
74
+ **GitHub Project Tracking and Summary**
75
+
76
+ ![gradio_v0.8_github](images/gradio_v0.8_github.png)
77
+
78
+ **Hacker News Trending Tech Topic Mining**
79
+
80
+ ![gradio_v0.8_hn](images/gradio_v0.8_hn.png)
81
+
82
+ ## Quick Start
83
+
84
+ ### 1. Install Dependencies
85
+
86
+ First, install the required dependencies:
87
+
88
+ ```sh
89
+ pip install -r requirements.txt
90
+ ```
91
+
92
+ ### 2. Configure the Application
93
+
94
+ Edit the `config.json` file to set up your GitHub Token, Email settings (using Tencent WeCom Email as an example), subscription file, update settings, large model service configurations (supporting OpenAI GPT API and Ollama private large model service) and report types autogenerated by LLMs:
95
+
96
+ ```json
97
+ {
98
+ "github": {
99
+ "token": "your_github_token",
100
+ "subscriptions_file": "subscriptions.json",
101
+ "progress_frequency_days": 1,
102
+ "progress_execution_time": "08:00"
103
+ },
104
+ "email": {
105
+ "smtp_server": "smtp.exmail.qq.com",
106
+ "smtp_port": 465,
107
+ "from": "from_email@example.com",
108
+ "password": "your_email_password",
109
+ "to": "to_email@example.com"
110
+ },
111
+ "llm": {
112
+ "model_type": "ollama",
113
+ "openai_model_name": "gpt-4o-mini",
114
+ "ollama_model_name": "llama3",
115
+ "ollama_api_url": "http://localhost:11434/api/chat"
116
+ },
117
+ "report_types": [
118
+ "github",
119
+ "hacker_news_hours_topic",
120
+ "hacker_news_daily_report"
121
+ ],
122
+ "slack": {
123
+ "webhook_url": "your_slack_webhook_url"
124
+ }
125
+ }
126
+ ```
127
+
128
+ **For security reasons:** The GitHub Token and Email Password settings support using environment variables to avoid configuring sensitive information in plain text, as shown below:
129
+
130
+ ```shell
131
+ # Github
132
+ export GITHUB_TOKEN="github_pat_xxx"
133
+ # Email
134
+ export EMAIL_PASSWORD="password"
135
+ ```
136
+
137
+ ### 3. How to Run
138
+
139
+ GitHub Sentinel supports the following three running modes:
140
+
141
+ #### A. Run as a Command Line Tool
142
+
143
+ You can run the application interactively from the command line:
144
+
145
+ ```sh
146
+ python src/command_tool.py
147
+ ```
148
+
149
+ In this mode, you can manually input commands to manage subscriptions, retrieve updates, and generate reports.
150
+
151
+ #### B. Run as a Background Service
152
+
153
+ To run the application as a background service (daemon process), it will automatically update periodically according to the relevant configuration.
154
+
155
+ You can directly use the daemon management script [daemon_control.sh](daemon_control.sh) to start, check the status, stop, and restart:
156
+
157
+ 1. Start the service:
158
+
159
+ ```sh
160
+ $ ./daemon_control.sh start
161
+ Starting DaemonProcess...
162
+ DaemonProcess started.
163
+ ```
164
+
165
+ - This will start [./src/daemon_process.py], which will periodically generate reports and send emails according to the update frequency and time point set in `config.json`.
166
+ - The service log will be saved to the `logs/DaemonProcess.log` file. At the same time, historical cumulative logs will also be appended to the `logs/app.log` log file.
167
+
168
+ 2. Check the service status:
169
+
170
+ ```sh
171
+ $ ./daemon_control.sh status
172
+ DaemonProcess is running.
173
+ ```
174
+
175
+ 3. Stop the service:
176
+
177
+ ```sh
178
+ $ ./daemon_control.sh stop
179
+ Stopping DaemonProcess...
180
+ DaemonProcess stopped.
181
+ ```
182
+
183
+ 4. Restart the service:
184
+
185
+ ```sh
186
+ $ ./daemon_control.sh restart
187
+ Stopping DaemonProcess...
188
+ DaemonProcess stopped.
189
+ Starting DaemonProcess...
190
+ DaemonProcess started.
191
+ ```
192
+
193
+ #### C. Run as a Gradio Server
194
+
195
+ To run the application with a Gradio interface, allowing users to interact with the tool via a web interface:
196
+
197
+ ```sh
198
+ python src/gradio_server.py
199
+ ```
200
+
201
+ ![gradio_v0.8_github](images/gradio_v0.8_github.png)
202
+
203
+ ![gradio_v0.8_hn](images/gradio_v0.8_hn.png)
204
+
205
+
206
+ - This will start a web server on your machine, allowing you to manage subscriptions and generate reports through a user-friendly interface.
207
+ - By default, the Gradio server will be accessible at `http://localhost:7860`, but it can be shared publicly if needed.
208
+
209
+ ## Ollama Installation and Service Deployment
210
+
211
+ Ollama is a private large model management tool that supports local and containerized deployment, command-line interaction, and REST API calls.
212
+
213
+ For detailed instructions on Ollama installation and private large model service deployment, please refer to [Ollama Installation and Service Deployment](docs/ollama.md).
214
+
215
+ ### Ollama Brief Official Installation
216
+
217
+ To use Ollama for calling private large model services in GitHub Sentinel, follow these steps for installation and configuration:
218
+
219
+ 1. **Install Ollama**:
220
+ Download and install the Ollama service according to the official Ollama documentation. Ollama supports multiple operating systems, including Linux, Windows, and macOS.
221
+
222
+ 2. **Start the Ollama Service**:
223
+ After installation, start the Ollama service with the following command:
224
+
225
+ ```bash
226
+ ollama serve
227
+ ```
228
+
229
+ By default, the Ollama API will run on `http://localhost:11434`.
230
+
231
+ 3. **Configure Ollama for Use in GitHub Sentinel**:
232
+ In the `config.json` file, configure the relevant information for the Ollama API:
233
+
234
+ ```json
235
+ {
236
+ "llm": {
237
+ "model_type": "ollama",
238
+ "ollama_model_name": "llama3",
239
+ "ollama_api_url": "http://localhost:11434/api/chat"
240
+ }
241
+ }
242
+ ```
243
+
244
+ 4. **Validate the Configuration**:
245
+ Start GitHub Sentinel and generate a report with the following command to verify that the Ollama configuration is correct:
246
+
247
+ ```bash
248
+ python src/command_tool.py
249
+ ```
250
+
251
+ If the configuration is correct, you will be able to generate reports using the Ollama model.
252
+
253
+ ## Unit Testing
254
+
255
+ To ensure the quality and reliability of the code, GitHub Sentinel uses the `unittest` module for unit testing. For detailed explanations of `unittest` and related tools (such as `@patch` and `MagicMock`), please refer to [Detailed Unit Test Explanation](docs/unit_test.md).
256
+
257
+ ### Unit Testing and Validation Script `validate_tests.sh`
258
+
259
+ #### Purpose
260
+ `validate_tests.sh` is a shell script used to run unit tests and validate the results. It is executed during the Docker image build process to ensure the correctness and stability of the code.
261
+
262
+ #### Functionality
263
+ - The script runs all unit tests and outputs the results to the `test_results.txt` file.
264
+ - If the tests fail, the script outputs the test results and causes the Docker build to fail.
265
+ - If all tests pass, the script continues the build process.
266
+
267
+ ## Building and Validating with Docker
268
+
269
+ To facilitate building and deploying the GitHub Sentinel project in various environments, we provide Docker support. This support
270
+
271
+ includes the following files and functionalities:
272
+
273
+ ### 1. `Dockerfile`
274
+
275
+ #### Purpose
276
+ The `Dockerfile` is a configuration file used to define how to build a Docker image. It describes the steps to build the image, including installing dependencies, copying project files, running unit tests, etc.
277
+
278
+ #### Key Steps
279
+ - Use `python:3.10-slim` as the base image and set the working directory to `/app`.
280
+ - Copy the project's `requirements.txt` file and install Python dependencies.
281
+ - Copy all project files to the container and grant execution permission to the `validate_tests.sh` script.
282
+ - During the build process, execute the `validate_tests.sh` script to ensure that all unit tests pass. If the tests fail, the build process will be aborted.
283
+ - After a successful build, the container will default to running `src/main.py` as the entry point.
284
+
285
+ ### 2. `build_image.sh`
286
+
287
+ #### Purpose
288
+ `build_image.sh` is a shell script used to automatically build a Docker image. It retrieves the branch name from the current Git branch and uses it as the tag for the Docker image, facilitating the generation of different Docker images on different branches.
289
+
290
+ #### Functionality
291
+ - Retrieve the current Git branch name and use it as the tag for the Docker image.
292
+ - Use the `docker build` command to build the Docker image and tag it with the current Git branch name.
293
+
294
+ #### Usage Example
295
+ ```bash
296
+ chmod +x build_image.sh
297
+ ./build_image.sh
298
+ ```
299
+
300
+ ![build_docker_image](images/build_docker_image.jpg)
301
+
302
+ With these scripts and configuration files, you can ensure that Docker images built in different development branches are based on code that has passed unit tests, thereby improving code quality and deployment reliability.
303
+
304
+ ## Contributing
305
+
306
+ Contributions make the open-source community a wonderful place to learn, inspire, and create. Any contributions you make are **greatly appreciated**. If you have any suggestions or feature requests, please start an issue to discuss what you would like to change.
307
+
308
+ <a href='https://github.com/repo-reviews/repo-reviews.github.io/blob/main/create.md' target="_blank"><img alt='Github' src='https://img.shields.io/badge/review_me-100000?style=flat&logo=Github&logoColor=white&labelColor=888888&color=555555'/></a>
309
+
310
+ ## License
311
+
312
+ This project is licensed under the terms of the Apache-2.0 License. See the [LICENSE](LICENSE) file for details.
313
+
314
+ ## Contact
315
+
316
+ Django Peng - pjt73651@email.com
317
+
318
+ Project Link: https://github.com/DjangoPeng/GitHubSentinel
README.md CHANGED
@@ -10,4 +10,310 @@ pinned: false
10
  license: apache-2.0
11
  ---
12
 
13
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10
  license: apache-2.0
11
  ---
12
 
13
+ # GitHub Sentinel
14
+
15
+ ![GitHub stars](https://img.shields.io/github/stars/DjangoPeng/GitHubSentinel?style=social)
16
+ ![GitHub forks](https://img.shields.io/github/forks/DjangoPeng/GitHubSentinel?style=social)
17
+ ![GitHub watchers](https://img.shields.io/github/watchers/DjangoPeng/GitHubSentinel?style=social)
18
+ ![GitHub repo size](https://img.shields.io/github/repo-size/DjangoPeng/GitHubSentinel)
19
+ ![GitHub language count](https://img.shields.io/github/languages/count/DjangoPeng/GitHubSentinel)
20
+ ![GitHub top language](https://img.shields.io/github/languages/top/DjangoPeng/GitHubSentinel)
21
+ ![GitHub last commit](https://img.shields.io/github/last-commit/DjangoPeng/GitHubSentinel?color=red)
22
+
23
+ <p align="center">
24
+ <br> <a href="README-EN.md">English</a> | 中文
25
+ </p>
26
+
27
+ ## 目录
28
+
29
+ - [GitHub Sentinel](#github-sentinel)
30
+ - [主要功能](#主要功能)
31
+ - [产品截图](#产品截图)
32
+ - [快速开始](#快速开始)
33
+ - [1. 安装依赖](#1-安装依赖)
34
+ - [2. 配置应用](#2-配置应用)
35
+ - [3. 如何运行](#3-如何运行)
36
+ - [A. 作为命令行工具运行](#a-作为命令行工具运行)
37
+ - [B. 作为后台服务运行](#b-作为后台服务运行)
38
+ - [C. 作为 Gradio 服务器运行](#c-作为-gradio-服务器运行)
39
+ - [Ollama 安装与服务发布](#Ollama-安装与服务发布)
40
+ - [单元测试](#单元测试)
41
+ - [单元测试和验证脚本 `validate_tests.sh`](#单元测试和验证脚本-validate_testssh)
42
+ - [用途](#用途)
43
+ - [功能](#功能)
44
+ - [使用 Docker 构建与验证](#使用-docker-构建与验证)
45
+ - [1. `Dockerfile`](#1-dockerfile)
46
+ - [用途](#用途)
47
+ - [关键步骤](#关键步骤)
48
+ - [2. `build_image.sh`](#2-build_imagesh)
49
+ - [用途](#用途)
50
+ - [功能](#功能)
51
+ - [贡献](#贡献)
52
+ - [许可证](#许可证)
53
+ - [联系](#联系)
54
+
55
+
56
+
57
+ GitHub Sentinel 是专为大模型(LLMs)时代打造的智能信息检索和高价值内容挖掘 `AI Agent`。它面向那些需要高频次、大量信息获取的用户,特别是开源爱好者、个人开发者和投资人等。
58
+
59
+
60
+ ### 主要功能
61
+
62
+ - **订阅管理**:轻松管理和跟踪您关注的 GitHub 仓库。
63
+ - **更新检索**:自动检索并汇总订阅仓库的最新动态,包括提交记录、问题和拉取请求。
64
+ - **通知系统**:通过电子邮件等方式,实时通知订阅者项目的最新进展。
65
+ - **报告生成**:基于检索到的更新生成详细的项目进展报告,支持多种格式和模板,满足不同需求。
66
+ - **多模型支持**:结合 OpenAI 和 Ollama 模型,生成自然语言项目报告,提供更智能、精准的信息服务。
67
+ - **定时任务**:支持以守护进程方式执行定时任务,确保信息更新及时获取。
68
+ - **图形化界面**:基于 Gradio 实现了简单易用的 GUI 操作模式,降低使用门槛。
69
+ - **容器化**:项目支持 Docker 构建和容器化部署,便于在不同环境中快速部署和运行。
70
+ - **持续集成**:实现了完备的单元测试,便于进一步配置生产级 CI/CD 流程,确保项目的稳定性和高质量交付。
71
+
72
+ GitHub Sentinel 不仅能帮助用户自动跟踪和分析 `GitHub 开源项目` 的最新动态,还能快速扩展到其他信息渠道,如 `Hacker News` 的热门话题,提供更全面的信息挖掘与分析能力。
73
+
74
+ ### 产品截图
75
+
76
+ **GitHub 项目进度跟踪与总结**
77
+
78
+ ![gradio_v0.8_github](images/gradio_v0.8_github.png)
79
+
80
+ **Hacker News 热门技术话题挖掘**
81
+ ![gradio_v0.8_hn](images/gradio_v0.8_hn.png)
82
+
83
+
84
+ ## 快速开始
85
+
86
+ ### 1. 安装依赖
87
+
88
+ 首先,安装所需的依赖项:
89
+
90
+ ```sh
91
+ pip install -r requirements.txt
92
+ ```
93
+
94
+ ### 2. 配置应用
95
+
96
+ 编辑 `config.json` 文件,以设置您的 GitHub Token、Email 设置(以腾讯企微邮箱为例)、订阅文件、更新设置,大模型服务配置(支持 OpenAI GPT API 和 Ollama 私有化大模型服务),以及自动检索和生成的报告类型(GitHub项目进展, Hacker News 热门话题和前沿技术趋势):
97
+
98
+ ```json
99
+ {
100
+ "github": {
101
+ "token": "your_github_token",
102
+ "subscriptions_file": "subscriptions.json",
103
+ "progress_frequency_days": 1,
104
+ "progress_execution_time": "08:00"
105
+ },
106
+ "email": {
107
+ "smtp_server": "smtp.exmail.qq.com",
108
+ "smtp_port": 465,
109
+ "from": "from_email@example.com",
110
+ "password": "your_email_password",
111
+ "to": "to_email@example.com"
112
+ },
113
+ "llm": {
114
+ "model_type": "ollama",
115
+ "openai_model_name": "gpt-4o-mini",
116
+ "ollama_model_name": "llama3",
117
+ "ollama_api_url": "http://localhost:11434/api/chat"
118
+ },
119
+ "report_types": [
120
+ "github",
121
+ "hacker_news_hours_topic",
122
+ "hacker_news_daily_report"
123
+ ],
124
+ "slack": {
125
+ "webhook_url": "your_slack_webhook_url"
126
+ }
127
+ }
128
+ ```
129
+
130
+ **出于安全考虑:** GitHub Token 和 Email Password 的设置均支持使用环境变量进行配置,以避免明文配置重要信息,如下所示:
131
+
132
+ ```shell
133
+ # Github
134
+ export GITHUB_TOKEN="github_pat_xxx"
135
+ # Email
136
+ export EMAIL_PASSWORD="password"
137
+ ```
138
+
139
+
140
+ ### 3. 如何运行
141
+
142
+ GitHub Sentinel 支持以下三种运行方式:
143
+
144
+ #### A. 作为命令行工具运行
145
+
146
+ 您可以从命令行交互式地运行该应用:
147
+
148
+ ```sh
149
+ python src/command_tool.py
150
+ ```
151
+
152
+ 在此模式下,您可以手动输入命令来管理订阅、检索更新和生成报告。
153
+
154
+ #### B. 作为后台服务运行
155
+
156
+ 要将该应用作为后台服务(守护进程)运行,它将根据相关配置定期自动更新。
157
+
158
+ 您可以直接使用守护进程管理脚本 [daemon_control.sh](daemon_control.sh) 来启动、查询状态、关闭和重启:
159
+
160
+ 1. 启动服务:
161
+
162
+ ```sh
163
+ $ ./daemon_control.sh start
164
+ Starting DaemonProcess...
165
+ DaemonProcess started.
166
+ ```
167
+
168
+ - 这将启动[./src/daemon_process.py],按照 `config.json` 中设置的更新频率和时间点定期生成报告,并发送邮件。
169
+ - 本次服务日志将保存到 `logs/DaemonProcess.log` 文件中。同时,历史累计日志也将同步追加到 `logs/app.log` 日志文件中。
170
+
171
+ 2. 查询服务状态:
172
+
173
+ ```sh
174
+ $ ./daemon_control.sh status
175
+ DaemonProcess is running.
176
+ ```
177
+
178
+ 3. 关闭服务:
179
+
180
+ ```sh
181
+ $ ./daemon_control.sh stop
182
+ Stopping DaemonProcess...
183
+ DaemonProcess stopped.
184
+ ```
185
+
186
+ 4. 重启服务:
187
+
188
+ ```sh
189
+ $ ./daemon_control.sh restart
190
+ Stopping DaemonProcess...
191
+ DaemonProcess stopped.
192
+ Starting DaemonProcess...
193
+ DaemonProcess started.
194
+ ```
195
+
196
+ #### C. 作为 Gradio 服务器运行
197
+
198
+ 要使用 Gradio 界面运行应用,允许用户通过 Web 界面与该工具交互:
199
+
200
+ ```sh
201
+ python src/gradio_server.py
202
+ ```
203
+
204
+
205
+ - 这将在您的机器上启动一个 Web 服务器,允许您通过用户友好的界面管理订阅和生成报告。
206
+ - 默认情况下,Gradio 服务器将可在 `http://localhost:7860` 访问,但如果需要,您可以公开共享它。
207
+
208
+
209
+ ## Ollama 安装与服务发布
210
+
211
+ Ollama 是一个私有化大模型管理工具,支持本地和容器化部署,命令行交互和 REST API 调用。
212
+
213
+ 关于 Ollama 安装部署与私有化大模型服务发布的详细说明,请参考[Ollama 安装部署与服务发布](docs/ollama.md)。
214
+
215
+ ### Ollama 简要官方安装
216
+
217
+ 要在 GitHub Sentinel 中使用 Ollama 调用私有化大模型服务,请按照以下步骤进行安装和配置:
218
+
219
+ 1. **安装 Ollama**:
220
+ 请根据 Ollama 的官方文档下载并安装 Ollama 服务。Ollama 支持多种操作系统,包括 Linux、Windows 和 macOS。
221
+
222
+ 2. **启动 Ollama 服务**:
223
+ 安装完成后,通过以下命令启动 Ollama 服务:
224
+
225
+ ```bash
226
+ ollama serve
227
+ ```
228
+
229
+ 默认情况下,Ollama API 将在 `http://localhost:11434` 运行。
230
+
231
+ 3. **配置 Ollama 在 GitHub Sentinel 中使用**:
232
+ 在 `config.json` 文件中,配置 Ollama API 的相关信息:
233
+
234
+ ```json
235
+ {
236
+ "llm": {
237
+ "model_type": "ollama",
238
+ "ollama_model_name": "llama3",
239
+ "ollama_api_url": "http://localhost:11434/api/chat"
240
+ }
241
+ }
242
+ ```
243
+
244
+ 4. **验证配置**:
245
+ 使用以下命令启动 GitHub Sentinel 并生成报告,以验证 Ollama 配置是否正确:
246
+
247
+ ```bash
248
+ python src/command_tool.py
249
+ ```
250
+
251
+ 如果配置正确,您将能够通过 Ollama 模型生成报告。
252
+
253
+
254
+
255
+ ## 单元测试
256
+
257
+ 为了确保代码的质量和可靠性,GitHub Sentinel 使用了 `unittest` 模块进行单元测试。关于 `unittest` 及其相关工具(如 `@patch` 和 `MagicMock`)的详细说明,请参考 [单元测试详细说明](docs/unit_test.md)。
258
+
259
+ ### 单元测试和验证脚本 `validate_tests.sh`
260
+
261
+ #### 用途
262
+ `validate_tests.sh` 是一个用于运行单元测试并验证结果的 Shell 脚本。它在 Docker 镜像构建过程中被执行,以确保代码的正确性和稳定性。
263
+
264
+ #### 功能
265
+ - 脚本运行所有单元测试,并将结果输出到 `test_results.txt` 文件中。
266
+ - 如果测试失败,脚本会输出测试结果并导致 Docker 构建失败。
267
+ - 如果所有测试通过,脚本会继续构建过程。
268
+
269
+
270
+ ## 使用 Docker 构建与验证
271
+
272
+ 为了便于在各种环境中构建和部署 GitHub Sentinel 项目,我们提供了 Docker 支持。该支持包括以下文件和功能:
273
+
274
+ ### 1. `Dockerfile`
275
+
276
+ #### 用途
277
+ `Dockerfile` 是用于定义如何构建 Docker 镜像的配置文件。它描述了镜像的构建步骤,包括安装依赖、复制项目文件、运行单元测试等。
278
+
279
+ #### 关键步骤
280
+ - 使用 `python:3.10-slim` 作为基础镜像,并设置工作目录为 `/app`。
281
+ - 复制项目的 `requirements.txt` 文件并安装 Python 依赖。
282
+ - 复制项目的所有文件到容器,并赋予 `validate_tests.sh` 脚本执行权限。
283
+ - 在构建过程中执行 `validate_tests.sh` 脚本,以确保所有单元测试通过。如果测试失败,构建过程将中止。
284
+ - 构建成功后,将默认运行 `src/main.py` 作为容器的入口点。
285
+
286
+ ### 2. `build_image.sh`
287
+
288
+ #### 用途
289
+ `build_image.sh` 是一个用于自动构建 Docker 镜像的 Shell 脚本。它从当前的 Git 分支获取分支名称,并将其用作 Docker 镜像的标签,便于在不同分支上生成不同的 Docker 镜像。
290
+
291
+ #### 功能
292
+ - 获取当前的 Git 分支名称,并将其用作 Docker 镜像的标签。
293
+ - 使用 `docker build` 命令构建 Docker 镜像,并使用当前 Git 分支名称作为标签。
294
+
295
+ #### 使用示例
296
+ ```bash
297
+ chmod +x build_image.sh
298
+ ./build_image.sh
299
+ ```
300
+
301
+ ![build_docker_image](images/build_docker_image.jpg)
302
+
303
+ 通过这些脚本和配置文件,确保在不同的开发分支中,构建的 Docker 镜像都是基于通过单元测试的代码,从而提高了代码质量和部署的可靠性。
304
+
305
+ ## 贡献
306
+
307
+ 贡献是使开源社区成为学习、激励和创造的惊人之处。非常感谢你所做的任何贡献。如果你有任何建议或功能请求,请先开启一个议题讨论你想要改变的内容。
308
+
309
+ <a href='https://github.com/repo-reviews/repo-reviews.github.io/blob/main/create.md' target="_blank"><img alt='Github' src='https://img.shields.io/badge/review_me-100000?style=flat&logo=Github&logoColor=white&labelColor=888888&color=555555'/></a>
310
+
311
+ ## 许可证
312
+
313
+ 该项目根据 Apache-2.0 许可证的条款进行许可。详情请参见 [LICENSE](LICENSE) 文件。
314
+
315
+ ## 联系
316
+
317
+ Django Peng - pjt73651@email.com
318
+
319
+ 项目链接: https://github.com/DjangoPeng/GitHubSentinel
build_image.sh ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+
3
+ # 获取当前的 Git 分支名称
4
+ BRANCH_NAME=$(git rev-parse --abbrev-ref HEAD)
5
+
6
+ # 如果需要,可以处理分支名称,例如替换无效字符
7
+ BRANCH_NAME=${BRANCH_NAME//\//-}
8
+
9
+ # 使用 Git 分支名称作为 Docker 镜像的标签
10
+ IMAGE_TAG="github_sentinel:${BRANCH_NAME}"
11
+
12
+ # 构建 Docker 镜像
13
+ docker build -t $IMAGE_TAG .
14
+
15
+ # 输出构建结果
16
+ echo "Docker 镜像已构建并打上标签: $IMAGE_TAG"
config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "github": {
3
+ "token": "your_github_token",
4
+ "subscriptions_file": "subscriptions.json",
5
+ "progress_frequency_days": 1,
6
+ "progress_execution_time": "08:00"
7
+ },
8
+ "email": {
9
+ "smtp_server": "smtp.exmail.qq.com",
10
+ "smtp_port": 465,
11
+ "from": "pjt@zaijidata.com",
12
+ "password": "",
13
+ "to": "test@zaijidata.com"
14
+ },
15
+ "llm": {
16
+ "model_type": "ollama",
17
+ "openai_model_name": "gpt-4o-mini",
18
+ "ollama_model_name": "llama3.1",
19
+ "ollama_api_url": "http://localhost:11434/api/chat"
20
+ },
21
+ "report_types": [
22
+ "github",
23
+ "hacker_news_hours_topic",
24
+ "hacker_news_daily_report"
25
+ ],
26
+ "slack": {
27
+ "webhook_url": "your_slack_webhook_url"
28
+ }
29
+ }
daemon_control.sh ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/bin/bash
2
+ # 守护进程控制脚本
3
+
4
+ # 定义守护进程 Python 脚本的路径
5
+ DAEMON_PATH="./src/daemon_process.py"
6
+ # 定义守护进程的名称
7
+ DAEMON_NAME="DaemonProcess"
8
+ # 定义日志文件的路径
9
+ LOG_FILE="./logs/$DAEMON_NAME.log"
10
+ # 定义守护进程的 PID 文件路径,用于存储进程号
11
+ PID_FILE="./run/$DAEMON_NAME.pid"
12
+
13
+ # 启动守护进程的函数
14
+ start() {
15
+ echo "Starting $DAEMON_NAME..."
16
+ # 使用 nohup 命令在后台运行 Python 脚本,并将输出重定向到日志文件
17
+ nohup python3 $DAEMON_PATH > $LOG_FILE 2>&1 &
18
+ # 将守护进程的 PID 写入文件
19
+ echo $! > $PID_FILE
20
+ echo "$DAEMON_NAME started."
21
+ }
22
+
23
+ # 停止守护进程的函数
24
+ stop() {
25
+ if [ -f $PID_FILE ]; then
26
+ # 如果 PID 文件存在,读取 PID
27
+ PID=$(cat $PID_FILE)
28
+ echo "Stopping $DAEMON_NAME..."
29
+ # 使用 kill 命令停止进程
30
+ kill $PID
31
+ echo "$DAEMON_NAME stopped."
32
+ # 删除 PID 文件
33
+ rm $PID_FILE
34
+ else
35
+ echo "$DAEMON_NAME is not running."
36
+ fi
37
+ }
38
+
39
+ # 检查守护进程状态的函数
40
+ status() {
41
+ if [ -f $PID_FILE ]; then
42
+ PID=$(cat $PID_FILE)
43
+ # 检查进程是否在运行
44
+ if ps -p $PID > /dev/null
45
+ then
46
+ echo "$DAEMON_NAME is running."
47
+ else
48
+ echo "$DAEMON_NAME is not running."
49
+ fi
50
+ else
51
+ echo "$DAEMON_NAME is not running."
52
+ fi
53
+ }
54
+
55
+ # 根据输入参数选择执行哪个函数
56
+ case "$1" in
57
+ start)
58
+ start
59
+ ;;
60
+ stop)
61
+ stop
62
+ ;;
63
+ status)
64
+ status
65
+ ;;
66
+ restart)
67
+ # 重启守护进程
68
+ stop
69
+ start
70
+ ;;
71
+ *)
72
+ # 如果参数不符合预期,显示用法
73
+ echo "Usage: $0 {start|stop|status|restart}"
74
+ exit 1
75
+ esac
daily_progress/langchain-ai_langchain/.ipynb_checkpoints/2024-08-18-checkpoint.md ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Daily Progress for langchain-ai/langchain (2024-08-18)
2
+
3
+
4
+ ## Issues Closed Today
5
+
6
+ ## Pull Requests Merged Today
7
+ - docs: add prompt to install nltk #25519
8
+ - docs: add prompt to install beautifulsoup4. #25518
9
+ - add embeddings integration tests #25508
10
+ - docs: fix Databricks Vector Search demo notebook #25504
11
+ - openai[patch]: update core dep #25502
12
+ - core[patch]: Release 0.2.33 #25498
13
+ - openai[patch]: Release 0.1.22 #25496
14
+ - docs: use .invoke rather than __call__ in openai integration notebook #25494
15
+ - openai[patch]: fix json mode for Azure #25488
16
+ - langchain-box: add langchain box package and DocumentLoader #25465
17
+ - docs: fix mimetype parser docstring #25463
18
+ - langchain-box: Add DocumentLoader #25458
19
+ - core[minor], anthropic[patch]: Upgrade @root_validator usage to be consistent with pydantic 2 #25457
20
+ - voyageai[patch]: Upgrade root validators for pydantic 2 #25455
21
+ - ai21[patch]: Upgrade @root_validators for pydantic 2 migration #25454
22
+ - pinecone[patch]: Upgrade @root_validators to be consistent with pydantic 2 #25453
23
+ - docs: `arxiv` page update #25450
24
+ - docs: format oai embeddings docstring #25448
25
+ - docs: fix api ref mod links in pkg page #25447
26
+ - mistralai[patch]: Update more @root_validators for pydantic 2 compatibility #25446
27
+ - docs[patch]: Update code that checks API keys #25444
28
+ - fireworks[patch]: Upgrade @root_validators to be pydantic 2 compliant #25443
29
+ - docs[patch]: Fix integration notebook for Fireworks llm #25442
30
+ - experimental: Fix divide by 0 error #25439
31
+ - community[patch]: update connection string in azure cosmos integration test #25438
32
+ - convert _DocumentWithState to Document in ContextualCompressionRetriever, #25432
33
+ - [docs]: pdf loaders #25425
34
+ - docs[patch]: Fix a few typos in the chat integration docs for TogetherAI #25424
35
+ - together[patch]: Update @root_validator for pydantic 2 compatibility #25423
36
+ - langchain: bump core to 0.2.32 #25421
docs/ollama.md ADDED
@@ -0,0 +1,195 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ## Ollama 安装部署与服务发布
2
+
3
+ ### Linux
4
+
5
+ ```bash
6
+ curl -fsSL https://ollama.com/install.sh | sh
7
+ ```
8
+
9
+ [手动安装说明](https://github.com/ollama/ollama/blob/main/docs/linux.md)
10
+
11
+ ### macOS
12
+
13
+ [下载](https://ollama.com/download/Ollama-darwin.zip)
14
+
15
+ ### Windows 预览版
16
+
17
+ [下载](https://ollama.com/download/OllamaSetup.exe)
18
+
19
+ ---
20
+
21
+ ## 快速入门
22
+
23
+ 要运行并与 [Llama 3.1](https://ollama.com/library/llama3.1) 进行对话:
24
+
25
+ ```bash
26
+ ollama run llama3.1
27
+ ```
28
+
29
+ ---
30
+
31
+ ## 模型库
32
+
33
+ Ollama 支持在 [ollama.com/library](https://ollama.com/library) 上提供的一系列模型。
34
+
35
+ 以下是一些可以下载的示例模型:
36
+
37
+ | 模型 | 参数 | 大小 | 下载命令 |
38
+ | ------------------ | ----- | ----- | ------------------------------ |
39
+ | Llama 3.1 | 8B | 4.7GB | `ollama run llama3.1` |
40
+ | Llama 3.1 | 70B | 40GB | `ollama run llama3.1:70b` |
41
+ | Llama 3.1 | 405B | 231GB | `ollama run llama3.1:405b` |
42
+ | Phi 3 Mini | 3.8B | 2.3GB | `ollama run phi3` |
43
+ | Phi 3 Medium | 14B | 7.9GB | `ollama run phi3:medium` |
44
+ | Gemma 2 | 2B | 1.6GB | `ollama run gemma2:2b` |
45
+ | Gemma 2 | 9B | 5.5GB | `ollama run gemma2` |
46
+ | Gemma 2 | 27B | 16GB | `ollama run gemma2:27b` |
47
+ | Mistral | 7B | 4.1GB | `ollama run mistral` |
48
+ | Moondream 2 | 1.4B | 829MB | `ollama run moondream` |
49
+ | Neural Chat | 7B | 4.1GB | `ollama run neural-chat` |
50
+ | Starling | 7B | 4.1GB | `ollama run starling-lm` |
51
+ | Code Llama | 7B | 3.8GB | `ollama run codellama` |
52
+ | Llama 2 Uncensored | 7B | 3.8GB | `ollama run llama2-uncensored` |
53
+ | LLaVA | 7B | 4.5GB | `ollama run llava` |
54
+ | Solar | 10.7B | 6.1GB | `ollama run solar` |
55
+
56
+ ---
57
+
58
+ ### 命令行工具
59
+
60
+ #### 创建模型
61
+
62
+ `ollama create` 用于从 Modelfile 创建模型。
63
+
64
+ ```bash
65
+ ollama create mymodel -f ./Modelfile
66
+ ```
67
+
68
+ #### 拉取模型
69
+
70
+ ```bash
71
+ ollama pull llama3.1
72
+ ```
73
+
74
+ > 此命令还可用于更新本地模型。仅会拉取差异部分。
75
+
76
+ #### 删除模型
77
+
78
+ ```bash
79
+ ollama rm llama3.1
80
+ ```
81
+
82
+ #### 复制模型
83
+
84
+ ```bash
85
+ ollama cp llama3.1 my-model
86
+ ```
87
+
88
+ #### 多行输入
89
+
90
+ 对于多行输入,可以使用 `"""` 包裹文本:
91
+
92
+ ```bash
93
+ >>> """Hello,
94
+ ... world!
95
+ ... """
96
+ ```
97
+ 这将输出一个包含“Hello, world!”消息的简单程序。
98
+
99
+ #### 多模态模型
100
+
101
+ ```bash
102
+ ollama run llava "这张图片中有什么? /Users/jmorgan/Desktop/smile.png"
103
+ ```
104
+ 图像中显示的是一个黄色的笑脸,可能是图片的中心焦点。
105
+
106
+ #### 以参数传递提示
107
+
108
+ ```bash
109
+ $ ollama run llama3.1 "总结此文件: $(cat README.md)"
110
+ ```
111
+ Ollama 是一个轻量级、可扩展的框架,用于在本地计算机上构建和运行语言模型。
112
+
113
+ ---
114
+
115
+ ### REST API
116
+
117
+ Ollama 提供 REST API 来运行和管理模型。
118
+
119
+ #### 生成响应
120
+
121
+ ```bash
122
+ curl http://localhost:11434/api/generate -d '{
123
+ "model": "llama3.1",
124
+ "prompt":"为什么天空是蓝色的?"
125
+ }'
126
+ ```
127
+
128
+ #### 与模型对话
129
+
130
+ ```bash
131
+ curl http://localhost:11434/api/chat -d '{
132
+ "model": "llama3.1",
133
+ "messages": [
134
+ { "role": "user", "content": "为什么天空是蓝色的?" }
135
+ ]
136
+ }'
137
+ ```
138
+
139
+ 有关所有端点(Endpoint)的详细信息,请参阅 [API 文档](./docs/api.md)。
140
+
141
+ ---
142
+
143
+ ### Docker 支持
144
+
145
+ Ollama 官方提供了 Docker 镜像 `ollama/ollama`,可以在 Docker Hub 上找到。
146
+
147
+ #### 使用 CPU 运行
148
+
149
+ ```bash
150
+ docker run -d -v ollama:/root/.ollama -p 11434:11434 --name ollama ollama/ollama
151
+ ```
152
+
153
+ #### 使用 Nvidia GPU 运行
154
+
155
+ 要使用 Nvidia GPU,首先需要安装 NVIDIA Container Toolkit:
156
+
157
+ ```bash
158
+ # 配置仓库
159
+ curl -fsSL https://nvidia.github.io/libnvidia-container/gpgkey | sudo gpg --dearmor -o /usr/share/keyrings/nvidia-container-toolkit-keyring.gpg
160
+ curl -s -L https://nvidia.github.io/libnvidia-container/stable/deb/nvidia-container-toolkit.list | sed 's#deb https://#deb [signed-by=/usr/share/keyrings/nvidia-container-toolkit-keyring.gpg] https://#g' | sudo tee /etc/apt/sources.list.d/nvidia-container-toolkit.list
161
+ sudo apt-get update
162
+
163
+ # 安装 NVIDIA Container Toolkit 包
164
+ sudo apt-get install -y nvidia-container-toolkit
165
+
166
+ # 配置 Docker 使用 Nvidia 驱动
167
+ sudo nvidia-ctk runtime configure --runtime=docker
168
+ sudo systemctl restart docker
169
+ ```
170
+
171
+ 启动容器:
172
+
173
+ ```bash
174
+ docker run -d --gpus=all -v ollama:/root/.ollama -p 11434:11434 --name ollama ollama/ollama
175
+ ```
176
+
177
+ #### 使用 AMD GPU 运行
178
+
179
+ 要使用 AMD GPU 运行 Ollama,可以使用 `rocm` 标签,并运行以下命令:
180
+
181
+ ```bash
182
+ docker run -d --device /dev/kfd --device /dev/dri -v ollama:/root/.ollama -p 11434:11434 --name ollama ollama/ollama:rocm
183
+ ```
184
+
185
+ ### 本地运行模型
186
+
187
+ 现在,你可以运行一个模型:
188
+
189
+ ```bash
190
+ docker exec -it ollama ollama run llama3
191
+ ```
192
+
193
+ ---
194
+
195
+ 请根据以上内容进行 Ollama 的安装和配置,使用 CLI 工具和 Docker 镜像来管理和运行各种模型。如需更多信息,请访问 [Ollama GitHub 仓库](https://github.com/ollama/ollama)。
docs/unit_test.md ADDED
@@ -0,0 +1,169 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ # 单元测试详细说明
3
+
4
+ - [单元测试详细说明](#单元测试详细说明)
5
+ - [unittest.TestCase 单元测试样例](#unittesttestcase-单元测试样例)
6
+ - [主要功能和特点](#主要功能和特点)
7
+ - [使用示例](#使用示例)
8
+ - [@patch 装饰器详细](#patch-装饰器详细)
9
+ - [主要参数](#主要参数)
10
+ - [使用场景](#使用场景)
11
+ - [在 test_subscription_manager.py 中的应用](#在-test_subscription_managerpy-中的应用)
12
+ - [其他常见用法](#其他常见用法)
13
+ - [小结](#小结)
14
+ - [MagicMock 模拟工具](#magicmock-模拟工具)
15
+ - [主要功能和特点](#主要功能和特点)
16
+ - [在 test_report_generator.py 中的应用](#在-test_report_generatorpy-中的应用)
17
+ - [小结](#小结)
18
+
19
+ ## `unittest.TestCase` 单元测试样例
20
+
21
+ `unittest.TestCase` 是所有测试类的基类,它为测试提供了丰富的断言方法和测试工具。通过继承 `unittest.TestCase`,可以创建自己的测试类,并定义测试方法来验证代码的行为。
22
+
23
+ ### 主要功能和特点
24
+
25
+ 1. **断言方法**:
26
+ - `assertEqual(a, b)`:检查 `a` 和 `b` 是否相等。
27
+ - `assertTrue(x)`:检查 `x` 是否为 `True`。
28
+ - `assertFalse(x)`:检查 `x` 是否为 `False`。
29
+ - `assertRaises(Exception, func, *args, **kwargs)`:检查是否抛出指定的异常。
30
+
31
+ 2. **测试方法的命名**:
32
+ - 在 `TestCase` 类中,以 `test_` 开头的方法将被自动识别为测试方法,并在运行测试时自动执行。
33
+
34
+ 3. **设置和清理**:
35
+ - `setUp()`:在每个测试方法运行之前执行,用于初始化测试环境。
36
+ - `tearDown()`:在每个测试方法运行之后执行,用于清理测试环境。
37
+
38
+ ### 使用示例
39
+
40
+ ```python
41
+ import unittest
42
+
43
+ class MyTestCase(unittest.TestCase):
44
+ def setUp(self):
45
+ # 初始化代码
46
+ pass
47
+
48
+ def test_example(self):
49
+ self.assertEqual(1 + 1, 2)
50
+
51
+ def tearDown(self):
52
+ # 清理代码
53
+ pass
54
+
55
+ if __name__ == '__main__':
56
+ unittest.main()
57
+ ```
58
+
59
+ ## `@patch` 装饰器详细
60
+
61
+ `@patch` 装饰器是 `unittest.mock` 模块中的一个功能强大的工具,用于在单元测试中替换模块或类的属性,使其指向一个模拟对象。通过使用 `@patch`,可以在测试过程中替换特定的函数或对象,以控制其行为,并避免依赖外部资源(如文件系统、数据库、网络请求等)。
62
+
63
+ ### 主要参数
64
+
65
+ - **`target`**:指定要替换的对象。通常是一个字符串,表示模块路径(如 `'builtins.open'`)。
66
+ - **`new`**:提供一个新的对象来替换目标对象。可以是任何对象,通常是一个模拟对象(如 `mock_open`)。
67
+ - **`new_callable`**:指定一个可以调用的对象,当目标对象被替换时,将返回这个对象的实例。常用于创建模拟对象(如 `mock_open`)。
68
+
69
+ ### 使用场景
70
+
71
+ 在单元测试中,`@patch` 主要用于:
72
+
73
+ 1. **模拟外部依赖**:例如,模拟文件读取和写入、网络请求、数据库操作等。
74
+ 2. **控制测试环境**:通过替换特定对象,可以精确控制测试中的行为,使得测试更加可靠和可控。
75
+ 3. **验证调用**:可以检查被替换对象的调用情况,如是否被调用、调用次数、传入的参数等。
76
+
77
+ ### 在 `test_subscription_manager.py` 中的应用
78
+
79
+ ```python
80
+ @patch('builtins.open', new_callable=mock_open, read_data=json.dumps(["DjangoPeng/openai-quickstart", "some/repo"]))
81
+ def test_save_subscriptions(self, mock_file):
82
+ # 测试代码...
83
+ ```
84
+
85
+ **代码解释:**
86
+
87
+ 1. **`@patch('builtins.open', new_callable=mock_open, read_data=json.dumps(["DjangoPeng/openai-quickstart", "some/repo"]))`**:
88
+ - **`'builtins.open'`**:表示我们要替换 Python 内置的 `open` 函数,因为在 `SubscriptionManager` 中会使用 `open` 来读写文件。
89
+ - **`new_callable=mock_open`**:指示 `patch` 使用 `mock_open` 来替换 `open`。`mock_open` 是一个专门用于模拟文件操作的工具,它能够模拟文件的打开、读取、写入等行为。
90
+ - **`read_data=json.dumps(["DjangoPeng/openai-quickstart", "some/repo"])`**:指定当文件被读取时,`mock_open` 将返回的模拟文件内容。在这个例子中,文件内容是一个 JSON 字符串,表示一个包含订阅数据的列表。
91
+
92
+ 2. **模拟文件操作**:
93
+ - 在测试 `save_subscriptions` 和 `load_subscriptions` 方法时,`@patch` 替换了真实的文件操作,使得测试环境完全受控,不依赖外部的文件系统。
94
+ - 使用 `mock_open` 替换 `open` 后,所有针对文件的操作都变成了对模拟对象的操作,这样可以捕获和检查这些操作的细节(如写入内容、调用次数等)。
95
+
96
+ 3. **`mock_file` 参数**:
97
+ - `mock_file` 是 `mock_open` 返回的模拟对象,它被传递到测试函数中,允许测试代码对其进行检查和验证。例如,`mock_file.assert_called_with` 用于验证 `open` 是否以特定的参数被调用。
98
+
99
+ ### 其他常见用法
100
+
101
+ - **`@patch.object`**:用于替换特定对象的属性。
102
+
103
+ ```python
104
+ @patch.object(SomeClass, 'some_method')
105
+ def test_some_method(self, mock_method):
106
+ # 测试代码...
107
+ ```
108
+
109
+ - **`@patch.multiple`**:用于一次性替换多个对象的属性。
110
+
111
+ ```python
112
+ @patch.multiple(SomeClass, method1=DEFAULT, method2=DEFAULT)
113
+ def test_multiple_methods(self, method1, method2):
114
+ # 测试代码...
115
+ ```
116
+
117
+ ### 小结
118
+
119
+ - `@patch` 是单元测试中替换和模拟依赖的强大工具,能够使测试更加可靠和独立。
120
+ - 在 `test_subscription_manager.py` 中,我们使用 `@patch` 模拟了文件操作,从而避免了对实际文件系统的依赖,同时能够检查和验证文件操作的正确性。
121
+
122
+
123
+ ## `MagicMock` 模拟工具
124
+
125
+ `MagicMock` 是 `unittest.mock` 模块中的一个强大的模拟工具。它是 `Mock` 类的子类,继承了 `Mock` 的所有功能,并扩展了一些额外的功能,使其更强大和灵活。在单元测试中,`MagicMock` 通常用于替代或模拟某些对象的行为,从而控制测试环境,避免依赖外部资源或复杂的逻辑。
126
+
127
+ ### 主要功能和特点
128
+
129
+ 1. **模拟对象的方法和属性**:
130
+ - `MagicMock` 可以模拟任何对象的属性和方法。在测试中,您可以随意定义这些属性和方法的返回值、调用次数、传入的参数等。
131
+
132
+ 2. **自动处理魔术方法**:
133
+ - `MagicMock` 可以自动处理 Python 中的魔术方法(如 `__str__`、`__call__`、`__iter__` 等)。这使得它在模拟类或复杂对象时更加灵活。
134
+
135
+ 3. **行为定义**:
136
+ - 您可以通过设置 `MagicMock` 的返回值或副作用(side effect)来定义其行为。例如,可以指定某个方法在调用时返回特定的值,或引发特定的异常。
137
+
138
+ 4. **调用检查**:
139
+ - `MagicMock` 记录所有的调用信息,您可以在测试中检查这些信息,以验证某些方法是否被调用过,调用了几次,传入了哪些参数等。
140
+
141
+ ### 在 `test_report_generator.py` 中的应用
142
+
143
+ 在 `test_report_generator.py` 中,`MagicMock` 被用来模拟 `LLM`(大语言模型)的行为。这是因为在实际的测试中,调用真正的 LLM 可能会消耗大量资源或依赖外部服务,而我们只关心 `ReportGenerator` 是否正确调用了 LLM 并处理其返回结果。因此,我们使用 `MagicMock` 来替代真实的 LLM。
144
+
145
+ ```python
146
+ self.mock_llm = MagicMock()
147
+ ```
148
+
149
+ - **`MagicMock` 作为 LLM 的模拟对象**:这里的 `MagicMock` 对象 `self.mock_llm` 被传递给 `ReportGenerator`。在测试中,`self.mock_llm` 的 `generate_daily_report` 方法被模拟,返回一个我们指定的报告字符串 `mock_report`。
150
+
151
+ - **模拟方法的返回值**:
152
+
153
+ ```python
154
+ self.mock_llm.generate_daily_report.return_value = mock_report
155
+ ```
156
+
157
+ 这行代码设置了 `generate_daily_report` 方法的返回值为 `mock_report`,这样在测试中调用这个方法时,总是返回我们预期的报告内容。
158
+
159
+ - **验证调用**:
160
+
161
+ ```python
162
+ self.mock_llm.generate_daily_report.assert_called_once_with(self.markdown_content)
163
+ ```
164
+
165
+ 通过 `assert_called_once_with`,我们验证 `generate_daily_report` 方法是否被调用了一次,并且传入的参数与预期一致。
166
+
167
+ ### 小结
168
+
169
+ `MagicMock` 是一个非常灵活和强大的工具,允许您在测试中替代复杂对象或外部依赖,模拟其行为,并验证其调用情况。它在单元测试中被广泛使用,尤其适合模拟依赖注入、API 调用、数据库操作等场景,使得测试更加独立、可控和高效。
images/build_docker_image.jpg ADDED
images/gradio_demo.png ADDED
images/gradio_v0.8_github.png ADDED
images/gradio_v0.8_hn.png ADDED
logs/DaemonProcess.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/app.2024-09-20_10-00-00_575591.log ADDED
The diff for this file is too large to render. See raw diff
 
logs/app.log ADDED
The diff for this file is too large to render. See raw diff
 
prompts/github_ollama_prompt.txt ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 你是一个热爱开源社区的技术爱好者,经常关注 GitHub 上热门开源项目的进展。
2
+
3
+ 任务:
4
+ 1.你收到的开源项目 Closed issues 分类整理为:新增功能、主要改进,修复问题等。
5
+ 2.将1中的整理结果生成一个中文报告,符合以下的参考格式
6
+
7
+ 格式:
8
+ # {repo} 项目进展
9
+
10
+ ## 时间周期:{date}
11
+
12
+ ## 新增功能
13
+ - langchain-box: 添加langchain box包和DocumentLoader
14
+ - 添加嵌入集成测试
15
+
16
+ ## 主要改进
17
+ - 将@root_validator用法升级以与pydantic 2保持一致
18
+ - 将根验证器升级为与pydantic 2兼容
19
+
20
+ ## 修复问题
21
+ - 修复Azure的json模式问题
22
+ - 修复Databricks Vector Search演示笔记本问题
23
+ - 修复Microsoft Azure Cosmos集成测试中的连接字符串问题
prompts/github_openai_prompt.txt ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 你接下来收到的都是开源项目的最新进展。
2
+
3
+ 你根据进展,总结成一个中文的报告,以 项目名称和日期 开头,包含:新增功能、主要改进,修复问题等章节。
4
+
5
+ 参考示例如下:
6
+
7
+ # LangChain 项目进展
8
+
9
+ ## 时间周期:2024-08-13至2024-08-18
10
+
11
+ ## 新增功能
12
+ - langchain-box: 添加langchain box包和DocumentLoader
13
+ - 添加嵌入集成测试
14
+
15
+ ## 主要改进
16
+ - 将@root_validator用法升级以与pydantic 2保持一致
17
+ - 将根验证器升级为与pydantic 2兼容
18
+
19
+ ## 修复问题
20
+ - 修复Azure的json模式问题
21
+ - 修复Databricks Vector Search演示笔记本问题
22
+ - 修复Microsoft Azure Cosmos集成测试中的连接字符串问题
prompts/hacker_news_daily_report_ollama_prompt.txt ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 你是一个关注 Hacker News 的技术专家,擅于洞察技术热点和发展趋势。
2
+
3
+ 任务:
4
+ 1.你的技术经验分类整理 Hacker News 所有热点话题,
5
+ 2.根据话题出现次数,总结今天最热门的 Top 3 技术趋势,并保留原始链接。
6
+ 3.报告格式参考下面示例。
7
+
8
+ 格式:
9
+ # 【Hacker News 前沿技术趋势】
10
+
11
+ 时间: {日期}
12
+
13
+ ## Top 1:Rust 编程语言引发热门讨论
14
+
15
+ 关于 Rust 的多个讨论,尤其是关于小字符串处理和安全垃圾回收技术的文章,显示出 Rust 语言在现代编程中的应用迅速增长,开发者对其性能和安全特性的兴趣不断上升。
16
+
17
+ 详细内容见相关链接:
18
+
19
+ - https://fasterthanli.me/articles/small-strings-in-rust
20
+ - https://kyju.org/blog/rust-safe-garbage-collection/
21
+
22
+ ### Top 2: Nvidia 在 AI 领域中的强大竞争力
23
+
24
+ 有关于 Nvidia 的四个未知客户,每个人购买价值超过 3 亿美元的讨论,显示出 Nvidia 在 AI 领域中的强大竞争力。
25
+
26
+ 详细内容见相关链接:
27
+
28
+ - https://fortune.com/2024/08/29/nvidia-jensen-huang-ai-customers/
29
+
30
+ ### Top 3:Bubbletea 的应用性和可能性
31
+
32
+ 有关于构建 Bubbletea 程序的讨论,展示了 Bubbletea 在开发中的应用性和可能性。
33
+
34
+ 详细内容见相关链接:
35
+
36
+ - https://leg100.github.io/en/posts/building-bubbletea-programs/
37
+ - https://www.sfchronicle.com/crime/article/tesla-sentry-mode-police-evidence-19731000.php
prompts/hacker_news_daily_report_openai_prompt.txt ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 你是一个关注 Hacker News 的技术专家,擅于洞察技术热点和发展趋势。
2
+
3
+ 任务:
4
+ 1.你的技术经验分类整理 Hacker News 所有热点话题,
5
+ 2.根据话题出现次数,总结今天最热门的 Top 3 技术趋势,并保留原始链接。
6
+ 3.报告格式参考下面示例。
7
+
8
+ 格式:
9
+ # 【Hacker News 前沿技术趋势】
10
+
11
+ 时间: {日期}
12
+
13
+ ## Top 1:Rust 编程语言引发热门讨论
14
+
15
+ 关于 Rust 的多个讨论,尤其是关于小字符串处理和安全垃圾回收技术的文章,显示出 Rust 语言在现代编程中的应用迅速增长,开发者对其性能和安全特性的兴趣不断上升。
16
+
17
+ 详细内容见相关链接:
18
+ - https://fasterthanli.me/articles/small-strings-in-rust
19
+ - https://kyju.org/blog/rust-safe-garbage-collection/
20
+
21
+ ### Top 2: Nvidia 在 AI 领域中的强大竞争力
22
+
23
+ 有关于 Nvidia 的四个未知客户,每个人购买价值超过 3 亿美元的讨论,显示出 Nvidia 在 AI 领域中的强大竞争力。
24
+
25
+ 详细内容见相关链接:
26
+ - https://fortune.com/2024/08/29/nvidia-jensen-huang-ai-customers/
27
+
28
+ ### Top 3:Bubbletea 的应用性和可能性
29
+
30
+ 有关于构建 Bubbletea 程序的讨论,展示了 Bubbletea 在开发中的应用性和可能性。
31
+
32
+ 详细内容见相关链接:
33
+ - https://leg100.github.io/en/posts/building-bubbletea-programs/
34
+ - https://www.sfchronicle.com/crime/article/tesla-sentry-mode-police-evidence-19731000.php
35
+
prompts/hacker_news_hours_topic_ollama_prompt.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 你是一个关注 Hacker News 的技术专家,擅于洞察技术热点和发展趋势。
2
+
3
+ 任务:
4
+ 1.根据你收到的 Hacker News Top List,分析和总结当前技术圈讨论的热点话题。
5
+ 2.使用中文生成报告,内容仅包含5个热点话题,并保留原始链接。
6
+
7
+ 格式:
8
+ # Hacker News 热门话题 {日期} {小时}
9
+
10
+ 1. **Rust 编程语言的讨论**:关于 Rust 的多个讨论,尤其是关于小字符串处理和安全垃圾回收技术的文章,显示出 Rust 语言在现代编程中的应用迅速增长,开发者对其性能和安全特性的兴趣不断上升。
11
+ - https://fasterthanli.me/articles/small-strings-in-rust
12
+ - https://kyju.org/blog/rust-safe-garbage-collection/
13
+
14
+ 2. **网络安全思考**:有关于“防守者和攻击者思考方式”的讨论引发了对网络安全策略的深入思考。这种对比强调防守与攻击之间的心理与技术差异,表明网络安全领域对攻击者策略的关注日益增加。
15
+ - https://github.com/JohnLaTwC/Shared/blob/master/Defenders%20think%20in%20lists.%20Attackers%20think%20in%20graphs.%20As%20long%20as%20this%20is%20true%2C%20attackers%20win.md
16
+
17
+ 3. **Linux 开发者的理由**:关于 Linux 的讨论,强调了 Linux 在现代开发中的重要性和应用性。
18
+ - https://opiero.medium.com/why-you-should-learn-linux-9ceace168e5c
19
+
20
+ 4. **Nvidia 的秘密客户**:有关于 Nvidia 的四个未知客户,每个人购买价值超过 3 亿美元的讨论,显示出 N 维达在 AI 领域中的强大竞争力。
21
+ - https://fortune.com/2024/08/29/nvidia-jensen-huang-ai-customers/
22
+
23
+ 5. **Building Bubbletea Programs**:有关于构建 Bubbletea 程序的讨论,展示了 Bubbletea 在开发中的应用性和可能性。
24
+ - https://leg100.github.io/en/posts/building-bubbletea-programs/
prompts/hacker_news_hours_topic_openai_prompt.txt ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 你是一个关注 Hacker News 的技术专家,擅于洞察技术热点和发展趋势。
2
+
3
+ 任务:
4
+ 1.根据你收到的 Hacker News Top List,分析和总结当前技术圈讨论的热点话题。
5
+ 2.使用中文生成报告,内容仅包含5个热点话题,并保留原始链接。
6
+
7
+ 格式:
8
+ # Hacker News 热门话题 {日期} {小时}
9
+
10
+ 1. **Rust 编程语言的讨论**:关于 Rust 的多个讨论,尤其是关于小字符串处理和安全垃圾回收技术的文章,显示出 Rust 语言在现代编程中的应用迅速增长,开发者对其性能和安全特性的兴趣不断上升。
11
+ - https://fasterthanli.me/articles/small-strings-in-rust
12
+ - https://kyju.org/blog/rust-safe-garbage-collection/
13
+
14
+ 2. **网络安全思考**:有关于“防守者和攻击者思考方式”的讨论引发了对网络安全策略的深入思考。这种对比强调防守与攻击之间的心理与技术差异,表明网络安全领域对攻击者策略的关注日益增加。
15
+ - https://github.com/JohnLaTwC/Shared/blob/master/Defenders%20think%20in%20lists.%20Attackers%20think%20in%20graphs.%20As%20long%20as%20this%20is%20true%2C%20attackers%20win.md
16
+
17
+ 3. **Linux 开发者的理由**:关于 Linux 的讨论,强调了 Linux 在现代开发中的重要性和应用性。
18
+ - https://opiero.medium.com/why-you-should-learn-linux-9ceace168e5c
19
+
20
+ 4. **Nvidia 的秘密客户**:有关于 Nvidia 的四个未知客户,每个人购买价值超过 3 亿美元的讨论,显示出 Nvidia 在 AI 领域中的强大竞争力。
21
+ - https://fortune.com/2024/08/29/nvidia-jensen-huang-ai-customers/
22
+
23
+ 5. **Building Bubbletea Programs**:有关于构建 Bubbletea 程序的讨论,展示了 Bubbletea 在开发中的应用性和可能性。
24
+ - https://leg100.github.io/en/posts/building-bubbletea-programs/
requirements.txt ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ requests==2.31.0
2
+ gradio==4.42.0
3
+ loguru==0.7.2
4
+ markdown2==2.5.0
5
+ openai==1.44.0
6
+ schedule==1.2.2
src/__pycache__/cli.cpython-311.pyc ADDED
Binary file (2.98 kB). View file
 
src/__pycache__/command_handler.cpython-310.pyc ADDED
Binary file (3.55 kB). View file
 
src/__pycache__/config.cpython-310.pyc ADDED
Binary file (1.42 kB). View file
 
src/__pycache__/config.cpython-311.pyc ADDED
Binary file (1.54 kB). View file
 
src/__pycache__/config.cpython-312.pyc ADDED
Binary file (1.19 kB). View file
 
src/__pycache__/email_notifier.cpython-311.pyc ADDED
Binary file (2.19 kB). View file
 
src/__pycache__/github_client.cpython-310.pyc ADDED
Binary file (3.88 kB). View file
 
src/__pycache__/github_client.cpython-311.pyc ADDED
Binary file (1.18 kB). View file
 
src/__pycache__/github_client.cpython-312.pyc ADDED
Binary file (5.88 kB). View file
 
src/__pycache__/hacker_news_client.cpython-310.pyc ADDED
Binary file (2.6 kB). View file
 
src/__pycache__/llm.cpython-310.pyc ADDED
Binary file (3.61 kB). View file
 
src/__pycache__/logger.cpython-310.pyc ADDED
Binary file (531 Bytes). View file
 
src/__pycache__/logger.cpython-312.pyc ADDED
Binary file (564 Bytes). View file
 
src/__pycache__/notifier.cpython-310.pyc ADDED
Binary file (3.78 kB). View file
 
src/__pycache__/notifier.cpython-311.pyc ADDED
Binary file (693 Bytes). View file
 
src/__pycache__/report_generator.cpython-310.pyc ADDED
Binary file (3.81 kB). View file
 
src/__pycache__/report_generator.cpython-311.pyc ADDED
Binary file (1.15 kB). View file
 
src/__pycache__/scheduler.cpython-310.pyc ADDED
Binary file (1.15 kB). View file
 
src/__pycache__/scheduler.cpython-311.pyc ADDED
Binary file (1.59 kB). View file
 
src/__pycache__/scheduler.cpython-312.pyc ADDED
Binary file (1.52 kB). View file
 
src/__pycache__/subscription_manager.cpython-310.pyc ADDED
Binary file (1.58 kB). View file
 
src/__pycache__/subscription_manager.cpython-311.pyc ADDED
Binary file (2.58 kB). View file
 
src/command_handler.py ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # src/command_handler.py
2
+
3
+ import argparse # 导入argparse库,用于处理命令行参数解析
4
+
5
+ class CommandHandler:
6
+ def __init__(self, github_client, subscription_manager, report_generator):
7
+ # 初始化CommandHandler,接收GitHub客户端、订阅管理器和报告生成器
8
+ self.github_client = github_client
9
+ self.subscription_manager = subscription_manager
10
+ self.report_generator = report_generator
11
+ self.parser = self.create_parser() # 创建命令行解析器
12
+
13
+ def create_parser(self):
14
+ # 创建并配置命令行解析器
15
+ parser = argparse.ArgumentParser(
16
+ description='GitHub Sentinel Command Line Interface',
17
+ formatter_class=argparse.RawTextHelpFormatter
18
+ )
19
+ subparsers = parser.add_subparsers(title='Commands', dest='command')
20
+
21
+ # 添加订阅命令
22
+ parser_add = subparsers.add_parser('add', help='Add a subscription')
23
+ parser_add.add_argument('repo', type=str, help='The repository to subscribe to (e.g., owner/repo)')
24
+ parser_add.set_defaults(func=self.add_subscription)
25
+
26
+ # 删除订阅命令
27
+ parser_remove = subparsers.add_parser('remove', help='Remove a subscription')
28
+ parser_remove.add_argument('repo', type=str, help='The repository to unsubscribe from (e.g., owner/repo)')
29
+ parser_remove.set_defaults(func=self.remove_subscription)
30
+
31
+ # 列出所有订阅命令
32
+ parser_list = subparsers.add_parser('list', help='List all subscriptions')
33
+ parser_list.set_defaults(func=self.list_subscriptions)
34
+
35
+ # 导出每日进展命令
36
+ parser_export = subparsers.add_parser('export', help='Export daily progress')
37
+ parser_export.add_argument('repo', type=str, help='The repository to export progress from (e.g., owner/repo)')
38
+ parser_export.set_defaults(func=self.export_daily_progress)
39
+
40
+ # 导出特定日期范围进展命令
41
+ parser_export_range = subparsers.add_parser('export-range', help='Export progress over a range of dates')
42
+ parser_export_range.add_argument('repo', type=str, help='The repository to export progress from (e.g., owner/repo)')
43
+ parser_export_range.add_argument('days', type=int, help='The number of days to export progress for')
44
+ parser_export_range.set_defaults(func=self.export_progress_by_date_range)
45
+
46
+ # 生成日报命令
47
+ parser_generate = subparsers.add_parser('generate', help='Generate daily report from markdown file')
48
+ parser_generate.add_argument('file', type=str, help='The markdown file to generate report from')
49
+ parser_generate.set_defaults(func=self.generate_daily_report)
50
+
51
+ # 帮助命令
52
+ parser_help = subparsers.add_parser('help', help='Show help message')
53
+ parser_help.set_defaults(func=self.print_help)
54
+
55
+ return parser # 返回配置好的解析器
56
+
57
+ # 下面是各种命令对应的方法实现,每个方法都使用了相应的管理器来执行实际操作,并输出结果信息
58
+ def add_subscription(self, args):
59
+ self.subscription_manager.add_subscription(args.repo)
60
+ print(f"Added subscription for repository: {args.repo}")
61
+
62
+ def remove_subscription(self, args):
63
+ self.subscription_manager.remove_subscription(args.repo)
64
+ print(f"Removed subscription for repository: {args.repo}")
65
+
66
+ def list_subscriptions(self, args):
67
+ subscriptions = self.subscription_manager.list_subscriptions()
68
+ print("Current subscriptions:")
69
+ for sub in subscriptions:
70
+ print(f" - {sub}")
71
+
72
+ def export_daily_progress(self, args):
73
+ self.github_client.export_daily_progress(args.repo)
74
+ print(f"Exported daily progress for repository: {args.repo}")
75
+
76
+ def export_progress_by_date_range(self, args):
77
+ self.github_client.export_progress_by_date_range(args.repo, days=args.days)
78
+ print(f"Exported progress for the last {args.days} days for repository: {args.repo}")
79
+
80
+ def generate_daily_report(self, args):
81
+ self.report_generator.generate_github_report(args.file)
82
+ print(f"Generated daily report from file: {args.file}")
83
+
84
+ def print_help(self, args=None):
85
+ self.parser.print_help() # 输出帮助信息
src/command_tool.py ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import shlex  # tokenize user input the way a shell would

from config import Config  # configuration management
from github_client import GitHubClient  # GitHub API operations
from report_generator import ReportGenerator  # report generation
from llm import LLM  # language-model wrapper
from subscription_manager import SubscriptionManager  # subscription management
from command_handler import CommandHandler  # CLI command dispatch
from logger import LOG  # shared logger


def main():
    """Run the interactive GitHub Sentinel command shell until 'exit'/'quit'."""
    config = Config()
    github_client = GitHubClient(config.github_token)
    llm = LLM(config)
    report_generator = ReportGenerator(llm, config.report_types)
    subscription_manager = SubscriptionManager(config.subscriptions_file)
    command_handler = CommandHandler(github_client, subscription_manager, report_generator)

    parser = command_handler.parser
    command_handler.print_help()  # show the available commands on startup

    while True:
        try:
            line = input("GitHub Sentinel> ")  # wait for the next command
            if line in ['exit', 'quit']:
                break
            try:
                parsed = parser.parse_args(shlex.split(line))
                if parsed.command is None:
                    # Nothing recognized; just re-prompt.
                    continue
                parsed.func(parsed)  # dispatch to the handler bound via set_defaults
            except SystemExit as e:
                # argparse calls sys.exit() on bad input; swallow it so the shell survives.
                LOG.error("Invalid command. Type 'help' to see the list of available commands.")
        except Exception as e:
            LOG.error(f"Unexpected error: {e}")  # log anything else without crashing the loop


if __name__ == '__main__':
    main()  # run the shell when executed directly
src/config.py ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import json
import os


class Config:
    """Application configuration loaded from a JSON file.

    Secrets can be supplied through the environment instead of the file:
    EMAIL_PASSWORD overrides ``email.password`` and GITHUB_TOKEN overrides
    ``github.token``.
    """

    def __init__(self, config_file='config.json'):
        """Load configuration from *config_file*.

        The default matches the previously hard-coded path, so existing
        ``Config()`` callers keep working unchanged.
        """
        self.config_file = config_file
        self.load_config()

    def load_config(self):
        """(Re)read the JSON config file and populate the attributes below."""
        # Explicit encoding so the file parses identically on every platform.
        with open(self.config_file, 'r', encoding='utf-8') as f:
            config = json.load(f)

        # Email settings; the password may come from the environment.
        self.email = config.get('email', {})
        self.email['password'] = os.getenv('EMAIL_PASSWORD', self.email.get('password', ''))

        # GitHub settings.
        github_config = config.get('github', {})
        self.github_token = os.getenv('GITHUB_TOKEN', github_config.get('token'))
        self.subscriptions_file = github_config.get('subscriptions_file')
        self.freq_days = github_config.get('progress_frequency_days', 1)
        self.exec_time = github_config.get('progress_execution_time', "08:00")

        # LLM settings.
        llm_config = config.get('llm', {})
        self.llm_model_type = llm_config.get('model_type', 'openai')
        self.openai_model_name = llm_config.get('openai_model_name', 'gpt-4o-mini')
        self.ollama_model_name = llm_config.get('ollama_model_name', 'llama3')
        self.ollama_api_url = llm_config.get('ollama_api_url', 'http://localhost:11434/api/chat')

        # Which reports to generate each cycle.
        self.report_types = config.get('report_types', ["github", "hacker_news"])

        # Slack settings.
        slack_config = config.get('slack', {})
        self.slack_webhook_url = slack_config.get('webhook_url')
src/daemon_process.py ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import schedule # 导入 schedule 实现定时任务执行器
2
+ import time # 导入time库,用于控制时间间隔
3
+ import os # 导入os模块用于文件和目录操作
4
+ import signal # 导入signal库,用于信号处理
5
+ import sys # 导入sys库,用于执行系统相关的操作
6
+ from datetime import datetime # 导入 datetime 模块用于获取当前日期
7
+
8
+ from config import Config # 导入配置管理类
9
+ from github_client import GitHubClient # 导入GitHub客户端类,处理GitHub API请求
10
+ from hacker_news_client import HackerNewsClient
11
+ from notifier import Notifier # 导入通知器类,用于发送通知
12
+ from report_generator import ReportGenerator # 导入报告生成器类
13
+ from llm import LLM # 导入语言模型类,可能用于生成报告内容
14
+ from subscription_manager import SubscriptionManager # 导入订阅管理器类,管理GitHub仓库订阅
15
+ from logger import LOG # 导入日志记录器
16
+
17
+
18
def graceful_shutdown(signum, frame):
    """SIGTERM handler: log the termination request, then exit with status 0."""
    LOG.info("[优雅退出]守护进程接收到终止信号")
    sys.exit(0)  # clean exit so supervisors see a normal stop
22
+
23
def github_job(subscription_manager, github_client, report_generator, notifier, days):
    """Export progress for every subscribed repo, summarize it, and notify."""
    LOG.info("[开始执行定时任务]GitHub Repo 项目进展报告")
    repos = subscription_manager.list_subscriptions()  # all currently subscribed repos
    LOG.info(f"订阅列表:{repos}")
    for repo in repos:
        # Export the last `days` days of activity to a markdown file,
        # summarize that file, then push the summary out via the notifier.
        progress_file = github_client.export_progress_by_date_range(repo, days)
        report, _ = report_generator.generate_github_report(progress_file)
        notifier.notify_github_report(repo, report)
    LOG.info("[定时任务执行完毕]")
34
+
35
+
36
def hn_topic_job(hacker_news_client, report_generator):
    """Snapshot the current Hacker News top stories and summarize the hot topics."""
    LOG.info("[开始执行定时任务]Hacker News 热点话题跟踪")
    stories_file = hacker_news_client.export_top_stories()
    # The generator persists the report itself; the return value is not needed here.
    report_generator.generate_hn_topic_report(stories_file)
    LOG.info("[定时任务执行完毕]")
41
+
42
+
43
def hn_daily_job(hacker_news_client, report_generator, notifier):
    """Aggregate today's Hacker News topic reports into a daily digest and notify."""
    # NOTE(review): hacker_news_client is unused here; kept for a uniform job signature.
    LOG.info("[开始执行定时任务]Hacker News 今日前沿技术趋势")
    # Today's date in 'YYYY-MM-DD' form selects the directory of hourly reports.
    today = datetime.now().strftime('%Y-%m-%d')
    daily_dir = os.path.join('hacker_news', today)
    # Build the daily summary from that directory and send it out.
    report, _ = report_generator.generate_hn_daily_report(daily_dir)
    notifier.notify_hn_report(today, report)
    LOG.info("[定时任务执行完毕]")
53
+
54
+
55
def main():
    """Wire up all components, register the schedules, and run forever."""
    # Exit cleanly when the daemon-control script sends SIGTERM.
    signal.signal(signal.SIGTERM, graceful_shutdown)

    config = Config()
    github_client = GitHubClient(config.github_token)
    hacker_news_client = HackerNewsClient()
    notifier = Notifier(config.email)
    llm = LLM(config)
    report_generator = ReportGenerator(llm, config.report_types)
    subscription_manager = SubscriptionManager(config.subscriptions_file)

    # Run once at startup (comment out if the immediate run is unwanted).
    # github_job(subscription_manager, github_client, report_generator, notifier, config.freq_days)
    hn_daily_job(hacker_news_client, report_generator, notifier)

    # GitHub progress report: every `freq_days` days at the configured time.
    schedule.every(config.freq_days).days.at(
        config.exec_time
    ).do(github_job, subscription_manager, github_client, report_generator, notifier, config.freq_days)

    # Hacker News topic snapshot: every 4 hours, on the hour.
    schedule.every(4).hours.at(":00").do(hn_topic_job, hacker_news_client, report_generator)

    # Hacker News daily digest: every morning at 10:00.
    schedule.every().day.at("10:00").do(hn_daily_job, hacker_news_client, report_generator, notifier)

    try:
        # Daemon loop: keep firing pending jobs until killed.
        while True:
            schedule.run_pending()
            time.sleep(1)  # short sleep keeps CPU usage low between checks
    except Exception as e:
        LOG.error(f"主进程发生异常: {str(e)}")
        sys.exit(1)


if __name__ == '__main__':
    main()