Update run.py

2025-11-27 22:01:35 +03:00 · 2024-08-07 19:51:43 -04:00
parent 7050ed204b
commit 58690bf060
1 changed files with 115 additions and 47 deletions
--- a/run.py
+++ b/run.py
@ -13,16 +13,29 @@
 # limitations under the License.

 import logging
-
+import os
+from cryptography.fernet import Fernet
 from model import LanguageModelConfig, TransformerConfig, QuantizedWeight8bit as QW8Bit
 from runners import InferenceRunner, ModelRunner, sample_from_model

+# Secure Key Management
+KEY_ENV_VAR = 'ENCRYPTION_KEY'
+KEY = os.getenv(KEY_ENV_VAR)
+if not KEY:
+    raise ValueError(f"Encryption key must be set in the environment variable {KEY_ENV_VAR}")
+cipher_suite = Fernet(KEY)

-CKPT_PATH = "./checkpoints/"
+# Define paths
+CKPT_PATH = os.getenv('CHECKPOINT_PATH', './checkpoints/')
+TOKENIZER_PATH = os.getenv('TOKENIZER_PATH', './tokenizer.model')

+# Configure logging
+logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')

-def main():
-    grok_1_model = LanguageModelConfig(
+def initialize_model() -> LanguageModelConfig:
+    """Initialize and return the language model configuration."""
+    try:
+        model_config = LanguageModelConfig(
            vocab_size=128 * 1024,
            pad_token=0,
            eos_token=2,
@ -39,34 +52,89 @@ def main():
                num_layers=64,
                attn_output_multiplier=0.08838834764831845,
                shard_activations=True,
-            # MoE.
                num_experts=8,
                num_selected_experts=2,
-            # Activation sharding.
                data_axis="data",
                model_axis="model",
            ),
        )
+        logging.info("Model initialized successfully.")
+        return model_config
+    except Exception as e:
+        logging.error(f"Error initializing model: {e}")
+        raise
+
+def initialize_inference_runner(model: LanguageModelConfig) -> InferenceRunner:
+    """Initialize and return the inference runner."""
+    try:
        inference_runner = InferenceRunner(
            pad_sizes=(1024,),
            runner=ModelRunner(
-            model=grok_1_model,
+                model=model,
                bs_per_device=0.125,
                checkpoint_path=CKPT_PATH,
            ),
            name="local",
            load=CKPT_PATH,
-        tokenizer_path="./tokenizer.model",
+            tokenizer_path=TOKENIZER_PATH,
            local_mesh_config=(1, 8),
            between_hosts_config=(1, 1),
        )
        inference_runner.initialize()
-    gen = inference_runner.run()
+        logging.info("Inference runner initialized successfully.")
+        return inference_runner
+    except Exception as e:
+        logging.error(f"Error initializing inference runner: {e}")
+        raise

-    inp = "The answer to life the universe and everything is of course"
-    print(f"Output for prompt: {inp}", sample_from_model(gen, inp, max_len=100, temperature=0.01))
+def encrypt_message(message: str) -> str:
+    """Encrypt the message using Fernet encryption."""
+    try:
+        encrypted_message = cipher_suite.encrypt(message.encode())
+        return encrypted_message.decode()
+    except Exception as e:
+        logging.error(f"Error encrypting message: {e}")
+        raise

+def decrypt_message(encrypted_message: str) -> str:
+    """Decrypt the message using Fernet encryption."""
+    try:
+        decrypted_message = cipher_suite.decrypt(encrypted_message.encode())
+        return decrypted_message.decode()
+    except Exception as e:
+        logging.error(f"Error decrypting message: {e}")
+        raise
+
+def generate_text(prompt: str, runner: InferenceRunner) -> str:
+    """Generate text from the given prompt using the inference runner."""
+    try:
+        logging.info("Running inference...")
+        gen = runner.run()
+        return sample_from_model(gen, prompt, max_len=100, temperature=0.01)
+    except Exception as e:
+        logging.error(f"Error generating text: {e}")
+        raise
+
+def main():
+    try:
+        logging.info("Initializing model...")
+        model = initialize_model()
+        
+        logging.info("Setting up inference runner...")
+        inference_runner = initialize_inference_runner(model)
+        
+        prompt = "The answer to life the universe and everything is of course"
+        logging.info("Generating output...")
+        output = generate_text(prompt, inference_runner)
+        
+        encrypted_output = encrypt_message(output)
+        decrypted_output = decrypt_message(encrypted_output)
+        
+        logging.info(f"Output for prompt: {prompt}")
+        print(decrypted_output)
+    except Exception as e:
+        logging.error(f"An error occurred: {e}")

 if __name__ == "__main__":
-    logging.basicConfig(level=logging.INFO)
    main()
+