-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathconfig_temp.json
More file actions
1 lines (1 loc) · 9.16 KB
/
config_temp.json
File metadata and controls
1 lines (1 loc) · 9.16 KB
1
{"show_confidence_indicator": false, "ai_settings": {"confidence_threshold": 0.7, "use_semantic_analysis": true, "use_user_profiling": true, "cache_size": 10000, "max_workers": 4, "enable_learning": true}, "llm": {"enable": false, "provider": "openai", "base_url": "https://api.openai.com", "model": "gpt-4o-mini", "api_key_env": "OPENAI_API_KEY", "temperature": 0.0, "top_p": 1.0, "timeout_seconds": 25, "max_retries": 1, "prompt": {"task_description": "\u8bf7\u4f5c\u4e3a CleanBook-Agent\uff0c\u7cbe\u51c6\u8bc6\u522b\u6d4f\u89c8\u5668\u4e66\u7b7e\u7684\u4e3b\u9898\u3001\u610f\u56fe\u4e0e\u4f18\u5148\u7ea7\u3002", "steps": ["\u89e3\u6790\u4e66\u7b7e\u6807\u9898\u3001URL\u3001\u57df\u540d\u3001\u4e0a\u4e0b\u6587\uff0c\u8bc6\u522b\u6838\u5fc3\u4e3b\u9898", "\u5339\u914d\u63d0\u4f9b\u7684\u4e3b/\u5b50\u5206\u7c7b\uff0c\u5fc5\u8981\u65f6\u8fd4\u56de '\u672a\u5206\u7c7b' \u5e76\u8bf4\u660e\u539f\u56e0", "\u8f93\u51fa\u5305\u542b category\u3001confidence\u3001reasons\u3001facets\u3001priority_tags \u7684 JSON"], "scoring_notes": "\u82e5\u5206\u7c7b\u4e0d\u786e\u5b9a\uff0c\u8bf7\u964d\u4f4e\u7f6e\u4fe1\u5ea6\u5e76\u8bf4\u660e\u7591\u70b9\uff1b\u9700\u8981\u4eba\u5de5\u590d\u6838\u65f6\uff0c\u5728 facets.priority_tags \u4e2d\u52a0\u5165 'review'\u3002", "force_json": true}, "organizer": {"enable": false, "model": "", "temperature": 0.0, "top_p": 1.0, "timeout_seconds": 40, "max_retries": 1, "max_examples_per_category": 5, "max_domains_per_category": 5, "max_tokens": 1800, "force_json": true}}, "title_cleaning_rules": {"prefixes": ["\u767b\u5f55 |", "Sign in \u00b7", "\u767b\u5f55 "], "suffixes": ["- V2EX", "\u00b7 GitHub", "| Microsoft Learn", " - \u77e5\u4e4e", " - \u7b80\u4e66", " | \u9177 \u58f3 - CoolShell"], "replacements": {"&": "&", "<": "<", ">": ">", "--- ": "- ", "(7\u6761\u6d88\u606f)": ""}}, "taxonomy": {"subjects_file": "taxonomy/subjects.yaml", "resource_types_file": "taxonomy/resource_types.yaml"}, "processing_order": ["priority_rules", "category_rules"], "category_order": ["\ud83d\udcbc \u5de5\u4f5c\u53f0", "\ud83e\udd16 AI", "\ud83d\udcbb \u7f16\u7a0b", "\ud83e\uddec \u751f\u7269", "\ud83d\udcda \u5b66\u4e60", "\ud83d\udc65 \u793e\u533a", "\ud83d\udcf0 \u8d44\u8baf", "\ud83c\udfae \u5a31\u4e50", "\ud83d\udcc2 \u5176\u4ed6"], "domain_grouping_rules": {"\ud83e\udd16 AI": ["openai.com", "deepseek.com", "chatglm.cn", "huggingface.co", "labs.google", "replicate.com", "perplexity.ai", "mistral.ai"], "\ud83d\udcbb \u7f16\u7a0b": ["github.com", "gitlab.com", "docker.com", "kubernetes.io", "python.org", "rust-lang.org", "go.dev"], "\ud83e\uddec \u751f\u7269": ["broadinstitute.org", "bioconda.github.io", "illumina.com", "cngb.org", "stomics.tech", "nature.com"], "\ud83d\udc65 \u793e\u533a": ["linux.do", "v2ex.com", "news.ycombinator.com", "reddit.com"], "\ud83d\udcbc \u5de5\u4f5c\u53f0": ["zego.im", "zego.cloud", "genomics.cn", "bgi.com", "dingtalk.com"]}, "priority_rules": {"\ud83d\udcbc \u5de5\u4f5c\u53f0/\u53f8\u5185\u4e1a\u52a1": {"weight": 100, "rules": [{"match": "domain", "keywords": ["zego.im", "zego.cloud", "bgi.com", "genomics.cn", "dingtalk.com"]}]}}, "category_rules": {"\ud83e\udd16 AI/\u6a21\u578b\u5e73\u53f0": {"rules": [{"match": "domain", "keywords": ["openai.com", "huggingface.co", "cohere.com", "anthropic.com", "chatglm.cn", "hunyuan.tencent.com", "baichuan-ai.com", "mistral.ai", "reka.ai", "jina.ai", "qwen.ai", "deepseek.com"], "weight": 15}, {"match": "title", "keywords": ["gpt-4", "gpt4", "claude 3", "gemini", "llama", "sora", "\u5927\u6a21\u578b", "llm"], "weight": 10}]}, "\ud83e\udd16 AI/\u5e94\u7528\u5de5\u5177": {"rules": [{"match": "domain", "keywords": ["perplexity.ai", "aider.chat", "replicate.com", "midjourney.com", "styleai.art", "ghibliai.net", "voo.works", "readpaper.com", "codium.ai", "metaso.cn"], "weight": 10}, {"match": "title", "keywords": ["copilot", "langchain", "prompt", "stable diffusion", "aigc"], "weight": 8}]}, "\ud83d\udcbb \u7f16\u7a0b/\u7f16\u7a0b\u8bed\u8a00": {"rules": [{"match": "domain", "keywords": ["python.org", "rust-lang.org", "go.dev", "java.com", "elixir.bootlin.com"], "weight": 10}, {"match": "title", "keywords": ["python", "rust", "golang", " go ", "java", "c++", "openmp", "cuda"], "weight": 8, "must_not_contain": ["go out", "go shopping"]}]}, "\ud83d\udcbb \u7f16\u7a0b/\u4ee3\u7801\u4ed3\u5e93": {"rules": [{"match": "domain", "keywords": ["github.com", "gitlab.com", "gitee.com", "bitbucket.org", "sourceforge.net", "opensource.google", "opendev.org", "github.io"], "weight": 20}, {"match": "title", "keywords": ["\u4ee3\u7801\u4ed3\u5e93", "repository", "gitee", "github"], "weight": 10}]}, "\ud83d\udcbb \u7f16\u7a0b/Web\u5f00\u53d1": {"rules": [{"match": "domain", "keywords": ["vue-element-admin-site.panjiachen.com", "gioui.org", "webrtcforthecurious.com"], "weight": 8}, {"match": "title", "keywords": ["react", "vue", "angular", "webpack", "nodejs", "css", "html", "frontend", "echarts", "eslint"], "weight": 5}]}, "\ud83d\udcbb \u7f16\u7a0b/DevOps\u8fd0\u7ef4": {"rules": [{"match": "domain", "keywords": ["docker.com", "kubernetes.io", "helm.sh", "aliyun.com", "huaweicloud.com", "vercel.com", "netlify.com", "cloudflare.com", "apptainer.org", "coder.com", "unraid.net"], "weight": 10}, {"match": "title", "keywords": ["devops", "kubernetes", "docker", "ci/cd", "container", "jenkins", "prometheus", "grafana"], "weight": 7}]}, "\ud83e\uddec \u751f\u7269": {"rules": [{"match": "domain", "keywords": ["bioconda.github.io", "broadinstitute.org", "illumina.com", "ncbi.nlm.nih.gov", "stomics.tech", "cngb.org", "thermofisher.cn", "insvast.com", "harvard.edu", "biorxiv.org", "nature.com", "embopress.org", "rosalind.info", "biocontainers.pro", "singlecellcourse.org"], "weight": 20}, {"match": "title", "keywords": ["bioinformatics", "biotool", "rna-seq", "genomics", "genome", "fastq", "sam", "vcf", "bam", "bioperl", "cell", "qiime2", "gatk", "\u57fa\u56e0\u7ec4", "\u6d4b\u5e8f"], "weight": 15}]}, "\ud83d\udcda \u5b66\u4e60/\u6280\u672f\u6587\u6863": {"rules": [{"match": "domain", "keywords": ["stackoverflow.com", "stackexchange.com", "medium.com", "dev.to", "juejin.cn", "segmentfault.com", "infoq.com", "ruanyifeng.com", "coolshell.cn", "zhile.io", "eryajf.net", "mtlynch.io", "blog.codingconfessions.com"], "weight": 10}, {"match": "url_ends_with", "keywords": [".pdf"], "weight": 8}, {"match": "domain", "keywords": ["arxiv.org", "paperswithcode.com", "jalammar.github.io", "thenlp.space"], "weight": 15}, {"match": "domain", "keywords": ["greenteapress.com", "udlbook.github.io", "kancloud.cn", "ituring.com.cn", "norvig.com", "hello-algo.com", "gitbook.com"], "weight": 15}, {"match": "title", "keywords": ["book", "\u624b\u518c", "\u6307\u5357", "tutorial", "\u6559\u7a0b", "\u5b9e\u8df5", "\u5b9e\u6218", "\u8be6\u89e3", "\u653b\u7565"], "weight": 7}]}, "\ud83d\udcda \u5b66\u4e60/\u8bfe\u7a0b\u8bb2\u5ea7": {"rules": [{"match": "domain", "keywords": ["slides.com", "speakerdeck.com", "ocw.mit.edu", "youtube.com", "bilibili.com"], "weight": 8, "match_all_keywords_in": {"title": ["lecture", "course", "talk", "conference", "\u6559\u7a0b", "\u8bfe\u7a0b"]}}, {"match": "title", "keywords": ["\u5e7b\u706f\u7247", "\u6f14\u8bb2"], "weight": 5}]}, "\ud83d\udc65 \u793e\u533a": {"rules": [{"match": "domain", "keywords": ["linux.do", "v2ex.com"], "weight": 20}, {"match": "domain", "keywords": ["news.ycombinator.com", "reddit.com", "solidot.org", "hachyderm.io", "mastodon.social", "hupu.com", "chiphell.com"], "weight": 10}]}, "\ud83d\udcf0 \u8d44\u8baf": {"rules": [{"match": "domain", "keywords": ["techcrunch.com", "theverge.com", "producthunt.com", "36kr.com", "arstechnica.com", "cnbeta.com.tw"], "weight": 8}, {"match": "title", "keywords": ["news", "report", "\u5468\u520a", "weekly", "\u65e5\u62a5"], "weight": 5}]}, "\ud83c\udfae \u5a31\u4e50": {"rules": [{"match": "domain", "keywords": ["gying.si", "hifini.com", "music.163.com", "douban.com", "dribbble.com", "behance.net", "unsplash.com", "thefarside.com"], "weight": 8}, {"match": "title", "keywords": ["\u7535\u5f71", "\u97f3\u4e50", "music", "\u64ad\u5ba2", "wallpaper", "\u58c1\u7eb8", "\u6e38\u620f", "\u6f2b\u753b"], "weight": 5}]}, "\ud83c\udfae \u5a31\u4e50/\u5f71\u97f3": {"rules": [{"match": "domain", "keywords": ["youtube.com", "bilibili.com", "v.qq.com", "youku.com", "iqiyi.com", "moontv.click"], "weight": 8}, {"match": "title", "keywords": ["\u7535\u5f71", "\u7535\u89c6\u5267", "MV", "\u9884\u544a", "\u5468\u6df1", "MoonTV"], "weight": 6}]}, "\ud83d\udcc2 \u5176\u4ed6/\u5728\u7ebf\u670d\u52a1": {"rules": [{"match": "domain", "keywords": ["google.com", "baidu.com", "bing.com", "duckduckgo.com", "wolframalpha.com"], "weight": 5}, {"match": "title", "keywords": ["search", "\u641c\u7d22", "\u5728\u7ebf", "online", "web"], "weight": 3}, {"match": "domain", "keywords": ["deepl.com", "regex101.com", "codepen.io", "tldraw.com", "jsoncrack.com", "mermaid.live", "excalidraw.com", "star-history.com", "portableapps.com", "raycast.com"], "weight": 15}]}, "\ud83d\udcc2 \u5176\u4ed6/\u6587\u6863\u8d44\u6599": {"rules": [{"match": "title", "keywords": ["\u6587\u6863", "document", "\u8d44\u6599", "materials", "reference", "\u53c2\u8003"], "weight": 4}]}, "\ud83d\udcc2 \u5176\u4ed6/\u8f6f\u4ef6\u4e0b\u8f7d": {"rules": [{"match": "title", "keywords": ["\u4e0b\u8f7d", "download", "\u8f6f\u4ef6", "software", "app", "\u5e94\u7528"], "weight": 4}]}}}