hmnshudhmn24 committed 18 days ago

Commit

602b5b1

verified ·

1 Parent(s): 2860b6f

Upload 23 files

Browse files

Files changed (23) hide show

.gitignore +3 -0
LICENSE +3 -0
README.md +103 -3
config/graph_schema.json +10 -0
config/model_config.yaml +3 -0
data/examples.json +9 -0
data/synthetic_intents.json +6 -0
model_card.md +7 -0
notebooks/intentgraph_demo.ipynb +1 -0
requirements.txt +1 -0
scripts/export_model.py +5 -0
scripts/preprocess_data.py +5 -0
src/__init__.py +1 -0
src/graph_builder.py +10 -0
src/graph_updater.py +5 -0
src/inference.py +15 -0
src/intent_extractor.py +7 -0
src/tokenizer.py +3 -0
tests/test_graph_building.py +6 -0
tests/test_intent_extraction.py +6 -0
training/evaluate.py +5 -0
training/loss.py +2 -0
training/train.py +5 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,3 @@

+__pycache__/
+.env
+*.pyc

LICENSE ADDED Viewed

	@@ -0,0 +1,3 @@

+Apache License
+Version 2.0, January 2004
+http://www.apache.org/licenses/

README.md CHANGED Viewed

@@ -1,3 +1,103 @@
----
-license: apache-2.0
----

+# IntentGraphLM 🚀
+**IntentGraphLM** is an open-source language model pipeline that converts raw natural language into **dynamic intent graphs**, enabling smarter agents, workflow orchestration, and multi-step task planning.
+This project is designed to be **lightweight, extensible, and Hugging Face–ready**, with strong future scope in agentic AI systems.
+---
+## 🔍 What Problem Does It Solve?
+Traditional intent detection returns flat labels.
+IntentGraphLM goes further by:
+- Extracting **multiple intents**
+- Modeling **relationships between intents**
+- Representing them as a **directed graph**
+- Enabling **dynamic updates** during conversations
+---
+## ✨ Key Features
+- 🧠 Intent extraction from raw text
+- 🕸️ Graph-based intent representation
+- 🔁 Dynamic intent graph updates
+- ⚡ Lightweight, dependency-minimal design
+- 🤗 Hugging Face–compatible inference pipeline
+- 🧩 Modular and extensible architecture
+---
+## 📂 Project Structure
+```
+intentgraph-lm/
+├── config/
+├── data/
+├── src/
+├── training/
+├── scripts/
+├── tests/
+├── notebooks/
+├── README.md
+├── model_card.md
+├── requirements.txt
+└── LICENSE
+```
+---
+## ⚙️ Installation
+```bash
+pip install -r requirements.txt
+```
+---
+## 🚀 Quick Usage
+```python
+from src import IntentGraphPipeline
+pipeline = IntentGraphPipeline()
+output = pipeline("Book a flight and then reserve a hotel")
+print(output)
+```
+---
+## 🧠 How It Works
+1. Tokenization
+2. Intent Extraction
+3. Graph Building
+4. Dynamic Updates
+---
+## 🧪 Testing
+```bash
+pytest tests/
+```
+---
+## 🔮 Future Scope
+- Transformer-based intent extraction
+- Hierarchical intent graphs
+- Agent tool planning
+- Multilingual support
+- Hugging Face pipeline release
+- Gradio demo space
+---
+## 📜 License
+Apache License 2.0

config/graph_schema.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "node_types": [
+    "intent"
+  ],
+  "edge_types": [
+    "depends_on",
+    "follows"
+  ],
+  "weighted": true
+}

config/model_config.yaml ADDED Viewed

	@@ -0,0 +1,3 @@

+model_name: intentgraph-lm
+max_intents: 5
+confidence_threshold: 0.5

data/examples.json ADDED Viewed

	@@ -0,0 +1,9 @@

+[
+  {
+    "text": "Book a flight and then reserve a hotel",
+    "intents": [
+      "book_flight",
+      "reserve_hotel"
+    ]
+  }
+]

data/synthetic_intents.json ADDED Viewed

	@@ -0,0 +1,6 @@

+[
+  "book_flight",
+  "reserve_hotel",
+  "order_food",
+  "check_weather"
+]

model_card.md ADDED Viewed

	@@ -0,0 +1,7 @@

+---
+language: en
+license: apache-2.0
+pipeline_tag: text-to-graph
+---
+# IntentGraphLM

notebooks/intentgraph_demo.ipynb ADDED Viewed

	@@ -0,0 +1 @@


1	+ {"cells": [], "metadata": {}, "nbformat": 4, "nbformat_minor": 5}

requirements.txt ADDED Viewed

	@@ -0,0 +1 @@


1	+ networkx

scripts/export_model.py ADDED Viewed

	@@ -0,0 +1,5 @@

def export():
    """Print a notice that the model is being exported.

    No export logic is implemented here; the function only writes the
    notice to stdout.
    """
    notice = 'Exporting model'
    print(notice)


if __name__ == '__main__':
    # Only run the export when this file is executed as a script.
    export()

scripts/preprocess_data.py ADDED Viewed

	@@ -0,0 +1,5 @@

def preprocess():
    """Print a notice that data preprocessing is running.

    No preprocessing logic is implemented here; the function only writes
    the notice to stdout.
    """
    notice = 'Preprocessing data'
    print(notice)


if __name__ == '__main__':
    # Only run preprocessing when this file is executed as a script.
    preprocess()

src/__init__.py ADDED Viewed

	@@ -0,0 +1 @@


1	+ from .inference import IntentGraphPipeline

src/graph_builder.py ADDED Viewed

	@@ -0,0 +1,10 @@

+import networkx as nx
class GraphBuilder:
    """Turns an ordered sequence of intents into a directed chain graph."""

    def build(self, intents):
        """Build a ``networkx.DiGraph`` from ``intents``.

        Every intent becomes a node tagged ``type='intent'``. Each intent
        after the first is linked from the one immediately before it by an
        edge with ``weight=1.0``.

        Args:
            intents: Indexable sequence of hashable intent identifiers.

        Returns:
            The newly created directed graph.
        """
        chain = nx.DiGraph()
        for position, name in enumerate(intents):
            chain.add_node(name, type='intent')
            if position == 0:
                # The first intent has no predecessor to link from.
                continue
            chain.add_edge(intents[position - 1], name, weight=1.0)
        return chain

src/graph_updater.py ADDED Viewed

	@@ -0,0 +1,5 @@

class GraphUpdater:
    """Adds newly observed intents to an existing intent graph."""

    def update(self, graph, new_intent):
        """Ensure ``new_intent`` is a node of ``graph``.

        If the intent is not yet in the graph it is added as a node tagged
        ``type='intent'``; no edges are created. An intent that is already
        present is left untouched.

        Args:
            graph: Graph object supporting ``in`` and ``add_node``.
            new_intent: Intent identifier to register.

        Returns:
            The same ``graph`` object that was passed in.
        """
        already_present = new_intent in graph
        if already_present:
            return graph
        graph.add_node(new_intent, type='intent')
        return graph

src/inference.py ADDED Viewed

	@@ -0,0 +1,15 @@

+from .tokenizer import SimpleTokenizer
+from .intent_extractor import IntentExtractor
+from .graph_builder import GraphBuilder
class IntentGraphPipeline:
    """End-to-end pipeline: text -> tokens -> intents -> intent graph."""

    def __init__(self):
        """Create the tokenizer, extractor and graph builder stages."""
        self.tokenizer = SimpleTokenizer()
        self.extractor = IntentExtractor()
        self.builder = GraphBuilder()

    def __call__(self, text: str):
        """Run the full pipeline on ``text``.

        Args:
            text: Raw input sentence.

        Returns:
            A dict with three keys: ``'intents'`` (the extractor output),
            ``'nodes'`` and ``'edges'`` (the built graph's nodes and edges,
            each materialised as a list).
        """
        found = self.extractor.extract(self.tokenizer.tokenize(text))
        built = self.builder.build(found)
        node_list = list(built.nodes)
        edge_list = list(built.edges)
        return {'intents': found, 'nodes': node_list, 'edges': edge_list}

src/intent_extractor.py ADDED Viewed

	@@ -0,0 +1,7 @@

class IntentExtractor:
    """Keyword-based intent extractor.

    A token counts as an intent when it exactly equals one of the known
    trigger keywords.
    """

    # Trigger words recognised as intents.
    _KEYWORDS = ('book', 'reserve', 'order', 'check')

    def extract(self, tokens):
        """Return the distinct intent keywords found in ``tokens``.

        The result preserves first-occurrence order. De-duplicating through
        a ``set`` would return the intents in arbitrary order, which matters
        to any consumer that treats the list as a sequence of steps.

        Args:
            tokens: Iterable of token strings.

        Returns:
            List of matching keywords, each appearing once, in the order
            they were first seen.
        """
        matches = (token for token in tokens if token in self._KEYWORDS)
        # dict keys keep insertion order, giving an order-preserving de-dup.
        return list(dict.fromkeys(matches))

src/tokenizer.py ADDED Viewed

	@@ -0,0 +1,3 @@

class SimpleTokenizer:
    """Lower-casing whitespace tokenizer that trims surrounding punctuation."""

    def tokenize(self, text: str):
        """Split ``text`` into lower-case word tokens.

        The text is lower-cased and split on whitespace. ASCII punctuation
        is then stripped from both ends of every piece, so "Book," and
        "hotel." become "book" and "hotel" and can be matched exactly.
        Punctuation inside a token (e.g. "check-in") is kept. Pieces that
        consist only of punctuation are dropped.

        Args:
            text: Raw input string.

        Returns:
            List of non-empty token strings.
        """
        import string

        trimmed = (piece.strip(string.punctuation) for piece in text.lower().split())
        return [token for token in trimmed if token]

tests/test_graph_building.py ADDED Viewed

	@@ -0,0 +1,6 @@

+from src.graph_builder import GraphBuilder
def test_graph():
    """Building from two intents yields a graph with exactly two nodes."""
    graph = GraphBuilder().build(['a', 'b'])
    node_count = len(graph.nodes)
    assert node_count == 2

tests/test_intent_extraction.py ADDED Viewed

	@@ -0,0 +1,6 @@

+from src.intent_extractor import IntentExtractor
def test_extract():
    """The 'book' keyword is reported when it appears among the tokens."""
    found = IntentExtractor().extract(['book', 'flight'])
    assert 'book' in found

training/evaluate.py ADDED Viewed

	@@ -0,0 +1,5 @@

def evaluate():
    """Print the evaluation placeholder message.

    No evaluation logic is implemented here; the function only writes the
    message to stdout.
    """
    notice = 'Evaluation placeholder'
    print(notice)


if __name__ == '__main__':
    # Only run evaluation when this file is executed as a script.
    evaluate()

training/loss.py ADDED Viewed

	@@ -0,0 +1,2 @@


def loss_fn(pred, target):
    """Return the absolute difference between the lengths of the inputs.

    Only the number of items is compared; the contents of ``pred`` and
    ``target`` are not inspected.

    Args:
        pred: Sized collection of predicted items.
        target: Sized collection of expected items.

    Returns:
        ``abs(len(pred) - len(target))`` as a non-negative int.
    """
    return abs(len(pred) - len(target))

training/train.py ADDED Viewed

	@@ -0,0 +1,5 @@

def train():
    """Print the training placeholder message.

    No training logic is implemented here; the function only writes the
    message to stdout.
    """
    notice = 'Training placeholder'
    print(notice)


if __name__ == '__main__':
    # Only run training when this file is executed as a script.
    train()