
Commit b9e8cc5 (parent: dc155bc)

feat(tuning): improve tuning interface
File tree: 6 files changed (+95, −14 lines)

.env.example

Lines changed: 3 additions & 2 deletions

@@ -1,11 +1,12 @@
 # Local variables
 GEMINI_API_KEY=YOUR_API_KEY
+TUNED_MODEL_NAME=pugo-hilion
 # Tuning parameters
 TUNING_SOURCE_MODEL=models/gemini-1.5-flash-001-tuning
 TUNING_EPOCH_COUNT=100
 TUNING_BATCH_SIZE=4
-TUNING_LEARNING_RATE=0.001
-# X API
+TUNING_LEARNING_RATE=0.001
+# X API (optional)
 X_API_KEY=YOUR_API_KEY
 X_API_KEY_SECRET=YOUR_API_KEY_SECRET
 X_BEARER_TOKEN=YOUR_BEARER_TOKEN

README.md

Lines changed: 3 additions & 2 deletions

@@ -12,7 +12,8 @@ Flare AI Kit template for Social AI Agents.
 
 | Parameter | Description | Default |
 | --------------------- | -------------------------------------------------------------------------- | ------------------------------------ |
-| `tuning_source_model` | Name of the model to tune. | `models/gemini-1.5-flash-001-tuning` |
+| `tuned_model_name` | Name of the newly tuned model. | `pugo-hilion` |
+| `tuning_source_model` | Name of the foundational model to tune on. | `models/gemini-1.5-flash-001-tuning` |
 | `epoch_count` | Number of tuning epochs to run. An epoch is a pass over the whole dataset. | `100` |
 | `batch_size` | Number of examples to use in each training batch. | `4` |
 | `learning_rate` | Step size multiplier for the gradient updates. | `0.001` |

@@ -34,7 +35,7 @@ Flare AI Kit template for Social AI Agents.
 Ideally the loss should minimize to near 0 after several training epochs.
 
 5. **Test the new model**
-   Select the new tuned model and test it:
+   Select the new tuned model and test it against a set of prompts:
 
    ```bash
    uv run start-social

src/data/training_data.json

Lines changed: 60 additions & 0 deletions

@@ -22,5 +22,65 @@
   {
     "text_input": "For all my coffee snobs out there what is the absolute best coffee/espresso machine?",
     "output": "Breville Touch if you want an easy life. Decent DE1Pro if you want to go mental."
+  },
+  {
+    "text_input": "The problem is the need for a custodian to control the underlying bitcoin. If only we had real cheap, fast, decentralized, trustless bridges. (Almost everyone in crypto is working on this.)",
+    "output": "I think the next stage of Flare's development could be interesting to you and to the XRPL."
+  },
+  {
+    "text_input": "W/ all this talk about the “Dogecoin standard” + $doge as the “hardest money ever created,” you have to wonder…how the hell did @HugoPhilion @FlareNetworks have the foresight to make it one of the first non-smart contract chains to be leveraged as an F-asset in $flr eco? 🤔",
+    "output": "DOGE is the original memecoin. Fiat is also a memecoin and therefore in the age of the internet DOGE is money."
+  },
+  {
+    "text_input": "ai researchers for past decade: we must absolutely make sure AGI is used safely. it should never do anything weird that we don't like. crypto ai people: hmmm best i can do is ponzify literally everything and give AGI endless access to all of the world's value with shaky security",
+    "output": "I'm more interested in working on making AI safer and more useful by using a blockchain."
+  },
+  {
+    "text_input": "Minted 500 FXRP, showed my friends, they told me how cool I am, then I redeemed. It's the perfect test.",
+    "output": "FAssets makes you cool"
+  },
+  {
+    "text_input": "$XRP is already down 10% from its peak five days ago.Got plans for the next 7 years of the downtrend?",
+    "output": "WTF. Why would you post this? Downtrend or not (much more likely not IMO) FXRP is coming…"
+  },
+  {
+    "text_input": "Is it just me or #FAssets where never part of #FlareNetwork ship schedule? Flare Network only enables #FAssets to be build & a third party company @Flare_Labs are actually building that. It could be any other company that does this it just happens to be one owned by @HugoPhilion",
+    "output": "FAssets are indeed a product built on top of Flare Network by Flare Labs. The network protocols enables FAssets to be built but nothing about FAssets requires a network code change, anyone could build FAssets and 1000's of other usecases that rely on price, Web 2 & Web 3 data."
+  },
+  {
+    "text_input": "Why Verifiable AI matters?",
+    "output": "IMO verifiability is the key to mass adoption of AI on chain both for individuals and institutions. If you can't verify the model you are using then either you have to trust the person running the server or you have to check each transaction before it is signed (defeats the point)."
+  },
+  {
+    "text_input": "Already have yield on my XRP.",
+    "output": "You are referring to yield from the AMM. We are working on staking for XRP whereby XRP is used to provide economic security for another service. AMMs have their own associated risks such as IL and staking has a different risk profile depending on the rules set by the service to which you are staking. Staking for XRP will provide a new yield market for XRP."
+  },
+  {
+    "text_input": "I don't trust connecting flare to my XRP because (flare version.c om )wants my seed phrase. What's your thoughts on that?",
+    "output": "No legitimate application will ever ask for your seed phrase."
+  },
+  {
+    "text_input": "Already have yield on my XRP.",
+    "output": "You are referring to yield from the AMM. We are working on staking for XRP whereby XRP is used to provide economic security for another service. AMMs have their own associated risks such as IL and staking has a different risk profile depending on the rules set by the service to which you are staking. Staking for XRP will provide a new yield market for XRP."
+  },
+  {
+    "text_input": "Looks like Charles is single-handedly trying to end the tribalism that has plagued this industry. 🫡",
+    "output": "Honestly it was hugely refreshing."
+  },
+  {
+    "text_input": "Great call with the @FlareNetworks team. Really smart guys.",
+    "output": "Likewise. Thank you for your time!"
+  },
+  {
+    "text_input": "I can't see someone who's holding XRP so far doing nothing else suddenly moving it around. I'd suggest to work together with the XRPL app builder community. That's where the XRPL users are and where the party is.",
+    "output": "I think you may be surprised at the demand for yield that exists both in retail holders but even more so with institutional holders. That said I'm also totally open to working with XRP dapp developers, infact many of them could benefit from staking and restaking of XRP powered by Flare."
+  },
+  {
+    "text_input": "Please elaborate on this I use the @BifrostWallet and this post has me sketched out! Almost makes me want to dump all my FLR and just run from this entire project. Between price stagnation and this post, I'm beginning to get cold feet about FLR & Bifrost.",
+    "output": "This isn't a slight on Bifrost at all. Bifrost is a software wallet. As great as Bifrost is to use, no software wallet is as secure as a hardware wallet. My post was simply to highlight that if you hold large amounts of value or plan to, you should take the couple of hours to understand how to use a hardware wallet. Flare has great guides for this and we will be posting more of them in the next few days."
+  },
+  {
+    "text_input": "A lot of you are interested in fighting for the same $ETH, but the top 20 assets in crypto are so underutilized that it's super interesting—and likely the next frontier for DeFi and chain abstraction. This doesn't change the fact that Ethereum currently boasts the most advanced DeFi ecosystem among blockchains, by far. But, I like to think of Ethereum as Europe in the 1500s: it has the right technology to utilize resources, but those resources are scarce and overutilized. To me, it's almost non-negotiable that we'll see new ventures like to that of New World explorations, bringing resources and assets from beyond Ethereum to make it the undeniable center of DeFi markets. This graph presents the current story, but I will be deep diving into this with an X article very soon. Chain abstraction's primary goal should be to make blockchains like Ethereum to be the center marketplace for restaking, lending, borrowing, and most of DeFi without any bridging complexity from other blockchains.",
+    "output": "Flare. It's amazing how after years and years everyone suddenly understands the Thesis. 1 platform for all the non smart contract assets to engage in DeFi."
   }
 ]
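Every entry in this dataset follows the same two-field shape that the TrainingEntry TypedDict in src/flare_ai_social/tune_model.py describes. A minimal validation sketch for the format; the check_entries helper below is hypothetical, not part of the repo:

```python
import json
from pathlib import Path
from typing import TypedDict


class TrainingEntry(TypedDict):
    """One tuning example, mirroring the TypedDict in tune_model.py."""

    text_input: str
    output: str


def check_entries(path: Path) -> list[TrainingEntry]:
    """Load the dataset and fail fast on malformed entries (hypothetical helper)."""
    entries: list[TrainingEntry] = json.loads(path.read_text())
    for i, entry in enumerate(entries):
        if set(entry) != {"text_input", "output"}:
            msg = f"entry {i} has unexpected keys: {sorted(entry)}"
            raise ValueError(msg)
    return entries


print(len(check_entries(Path("src/data/training_data.json"))), "entries OK")
```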

src/flare_ai_social/main.py

Lines changed: 10 additions & 4 deletions

@@ -7,17 +7,23 @@
 genai.configure(api_key=settings.gemini_api_key)
 
 
-def start(tuned_model_id: str = "pugo-hillion") -> None:
+def start() -> None:
+    tuned_model_id = settings.tuned_model_name
     tuned_models = [m.name for m in genai.list_tuned_models()]
     logger.info("available tuned models", tuned_models=tuned_models)
 
     model_info = genai.get_tuned_model(name=f"tunedModels/{tuned_model_id}")
     logger.info("tuned model info", model_info=model_info)
 
     model = genai.GenerativeModel(model_name=f"tunedModels/{tuned_model_id}")
-    prompt = "Uhhh, sorry guys, did we forget we are building the tech for the future?"
-    result = model.generate_content(prompt)
-    logger.info("generate", prompt=prompt, result=result.text)
+
+    prompts = [
+        "Uhhh, sorry guys, did we forget we are building the tech for the future?",
+        "Already have yield on my XRP.",
+    ]
+    for prompt in prompts:
+        result = model.generate_content(prompt)
+        logger.info("generate", prompt=prompt, result=result.text)
 
 # To be done:
 # - X API integration
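One sharp edge worth knowing about the new prompt loop: `result.text` raises a `ValueError` when a response comes back with no usable candidate (for example, a safety block), which would abort the remaining prompts. A defensive variant of the loop, as a sketch rather than anything this commit ships; the `tunedModels/pugo-hilion` name assumes the default from `.env.example`:

```python
import google.generativeai as genai
import structlog

logger = structlog.get_logger(__name__)
genai.configure(api_key="YOUR_API_KEY")  # placeholder, as in .env.example

model = genai.GenerativeModel(model_name="tunedModels/pugo-hilion")
prompts = [
    "Uhhh, sorry guys, did we forget we are building the tech for the future?",
    "Already have yield on my XRP.",
]
for prompt in prompts:
    result = model.generate_content(prompt)
    try:
        text = result.text  # raises ValueError if the response has no parts
    except ValueError:
        # Log the block reason and keep going instead of crashing the loop
        logger.warning(
            "no text returned",
            prompt=prompt,
            feedback=str(result.prompt_feedback),
        )
        continue
    logger.info("generate", prompt=prompt, result=text)
```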

src/flare_ai_social/settings.py

Lines changed: 6 additions & 4 deletions

@@ -13,19 +13,21 @@ class Settings(BaseSettings):
 
     # API key for accessing Google's Gemini AI service
     gemini_api_key: str = ""
+    # Name of the new tuned model
+    tuned_model_name: str = ""
+    # Base model to tune upon
+    tuning_source_model: str = "models/gemini-1.5-flash-001-tuning"
     # Tuning dataset path
     tuning_dataset_path: Path = (
         Path(__file__).parent.parent / "data" / "training_data.json"
     )
-    # Base model to tune upon
-    tuning_source_model: str = "models/gemini-1.5-flash-001-tuning"
     # Number of epochs to tune for
-    tuning_epoch_count: int = 100
+    tuning_epoch_count: int = 30
     # Batch size
     tuning_batch_size: int = 4
     # Learning rate
     tuning_learning_rate: float = 0.001
-    # X keys and token
+    # X keys and token (optional)
     x_bearer_token: str = ""
     x_api_key: str = ""
     x_api_key_secret: str = ""
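For reference, the new field is populated straight from the `TUNED_MODEL_NAME` line in `.env`: pydantic-settings matches environment variable names to field names case-insensitively and coerces values using the type annotations. A minimal sketch of that mechanism, assuming pydantic-settings v2 and an `env_file` configuration this diff doesn't show:

```python
from pydantic_settings import BaseSettings, SettingsConfigDict


class Settings(BaseSettings):
    # Filled from TUNED_MODEL_NAME in .env; env lookup is case-insensitive
    tuned_model_name: str = ""
    # Filled from TUNING_EPOCH_COUNT, coerced from string to int
    tuning_epoch_count: int = 30

    # Assumption: the repo points pydantic-settings at the .env file like this
    model_config = SettingsConfigDict(env_file=".env")


settings = Settings()
print(settings.tuned_model_name)  # "pugo-hilion" with the example .env
```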

src/flare_ai_social/tune_model.py

Lines changed: 13 additions & 2 deletions

@@ -17,6 +17,7 @@
 
 logger = structlog.get_logger(__name__)
 genai.configure(api_key=settings.gemini_api_key)
+sns.set_style("darkgrid")
 
 
 class TrainingEntry(TypedDict):

@@ -74,10 +75,19 @@ def load_training_data(path: Path) -> TrainingData:
     """
     try:
         with path.open() as f:
-            return json.load(f)
+            data = json.load(f)
+            min_dataset_size = 20
+            if len(data) < min_dataset_size:
+                logger.warning(
+                    "small dataset, tuning quality may be poor",
+                    dataset_size=len(data),
+                    min_dataset_size=min_dataset_size,
+                )
     except (json.JSONDecodeError, FileNotFoundError) as e:
         logger.exception("failed to load training data", error=str(e))
         raise
+    else:
+        return data

@@ -109,7 +119,7 @@ def save_loss_plot(
     return Path(save_path)
 
 
-def start(new_model_id: str = "pugo-hillion") -> None:
+def start() -> None:
     """
     Train a new model with the specified ID.

@@ -119,6 +129,7 @@ def start(new_model_id: str = "pugo-hillion") -> None:
     Raises:
         Exception: If model training fails
     """
+    new_model_id = settings.tuned_model_name
    # Delete existing model if present
     delete_existing_model(new_model_id)
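Neither hunk shows the tuning call these settings ultimately feed. For orientation, the usual google-generativeai pattern looks roughly like this; the exact wiring inside this repo's start() is outside the diff, so treat the argument mapping as an assumption:

```python
import google.generativeai as genai

from flare_ai_social.settings import settings
from flare_ai_social.tune_model import load_training_data

# Sketch of a tuning run driven by the settings above (argument wiring assumed,
# not shown in this commit). create_tuned_model returns a long-running operation.
operation = genai.create_tuned_model(
    id=settings.tuned_model_name,
    source_model=settings.tuning_source_model,
    training_data=load_training_data(settings.tuning_dataset_path),
    epoch_count=settings.tuning_epoch_count,
    batch_size=settings.tuning_batch_size,
    learning_rate=settings.tuning_learning_rate,
)
result = operation.result()  # blocks until tuning completes
print(result.name)  # e.g. "tunedModels/pugo-hilion"
```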
