⚡ Support for model meta-llama-3.1-405b-instruct

MrGraversen · MrGraversen · commit 3c82818cfdc6 · 2024-11-01T11:25:18.000+01:00
diff --git a/spring-boot-starter-replicate/src/main/java/io/graversen/replicate/llama3/Llama3Models.java b/spring-boot-starter-replicate/src/main/java/io/graversen/replicate/llama3/Llama3Models.java
@@ -5,6 +5,7 @@
 
 @UtilityClass
 public class Llama3Models {
+    public static final ReplicateModel LLAMA_3_1_405B_INSTRUCT = new ReplicateModel("meta", "meta-llama-3.1-405b-instruct");
     public static final ReplicateModel LLAMA_3_70B_INSTRUCT = new ReplicateModel("meta", "meta-llama-3-70b-instruct");
     public static final ReplicateModel LLAMA_3_8B_INSTRUCT = new ReplicateModel("meta", "meta-llama-3-8b-instruct");
 }
diff --git a/spring-boot-starter-replicate/src/main/java/io/graversen/replicate/llama3/Llama3PredictionMapper.java b/spring-boot-starter-replicate/src/main/java/io/graversen/replicate/llama3/Llama3PredictionMapper.java
@@ -3,10 +3,7 @@
 import io.graversen.replicate.common.BasePredictionMapper;
 import io.graversen.replicate.common.PredictionTypes;
 import io.graversen.replicate.common.ReplicateModel;
-import io.graversen.replicate.models.MetaMetaLlama370BInstructInput;
-import io.graversen.replicate.models.MetaMetaLlama370BInstructPredictionrequest;
-import io.graversen.replicate.models.MetaMetaLlama38BInstructInput;
-import io.graversen.replicate.models.MetaMetaLlama38BInstructPredictionrequest;
+import io.graversen.replicate.models.*;
 import io.graversen.replicate.service.CreateTextPrediction;
 import lombok.NonNull;
 import org.springframework.stereotype.Component;
@@ -19,6 +16,7 @@ public class Llama3PredictionMapper extends BasePredictionMapper<CreateTextPredi
     @Override
     protected Set<ReplicateModel> supportedModels() {
         return Set.of(
+                Llama3Models.LLAMA_3_1_405B_INSTRUCT,
                 Llama3Models.LLAMA_3_70B_INSTRUCT,
                 Llama3Models.LLAMA_3_8B_INSTRUCT
         );
@@ -44,6 +42,15 @@ public Object apply(@NonNull ReplicateModel model, @NonNull CreateTextPrediction
                     null,
                     null
             );
+        } else if (model.equals(Llama3Models.LLAMA_3_1_405B_INSTRUCT)) {
+            return new MetaMetaLlama31405BInstructPredictionrequest(
+                    null,
+                    mapLlama31405bInput().apply(createPrediction),
+                    null,
+                    null,
+                    null,
+                    null
+            );
         } else {
             throw new IllegalArgumentException("Unsupported Replicate Model: " + model);
         }
@@ -54,6 +61,27 @@ public boolean supportsType(@NonNull PredictionTypes type) {
         return PredictionTypes.TEXT.equals(type);
     }
 
+    Function<CreateTextPrediction, MetaMetaLlama31405BInstructInput> mapLlama31405bInput() {
+        return createTextPrediction -> {
+            final var conversation = createTextPrediction.getConversation();
+            final var truncatedConversation = Llama3Tokenizer.fitToContextWindow(conversation, Llama3Tokenizer.DEFAULT_CONTEXT_WINDOW_SIZE);
+            final var textCompletion = Llama3Tokenizer.generateTextCompletion(truncatedConversation);
+
+            return new MetaMetaLlama31405BInstructInput(
+                    createTextPrediction.getTopK(),
+                    createTextPrediction.getTopP(),
+                    textCompletion.getText(),
+                    createTextPrediction.getMaxTokens(),
+                    createTextPrediction.getMinTokens(),
+                    createTextPrediction.getTemperature(),
+                    truncatedConversation.getSystemMessage(),
+                    null,
+                    null,
+                    null
+            );
+        };
+    }
+
     Function<CreateTextPrediction, MetaMetaLlama370BInstructInput> mapLlama370bInput() {
         return createTextPrediction -> {
             final var conversation = createTextPrediction.getConversation();

Original file line number	Diff line number	Diff line change
`@@ -5,6 +5,7 @@`
`5`	`5`
`6`	`6`	`@UtilityClass`
`7`	`7`	`public class Llama3Models {`
	`8`	`+ public static final ReplicateModel LLAMA_3_1_405B_INSTRUCT = new ReplicateModel("meta", "meta-llama-3.1-405b-instruct");`
`8`	`9`	`public static final ReplicateModel LLAMA_3_70B_INSTRUCT = new ReplicateModel("meta", "meta-llama-3-70b-instruct");`
`9`	`10`	`public static final ReplicateModel LLAMA_3_8B_INSTRUCT = new ReplicateModel("meta", "meta-llama-3-8b-instruct");`
`10`	`11`	`}`