Skip to content
This repository has been archived by the owner on Jun 22, 2024. It is now read-only.

Commit

Permalink
Merge pull request #12 from dave-gray101/llama2
Browse files Browse the repository at this point in the history
"LLAMA2 Chat" model gallery base model
  • Loading branch information
mudler committed Jul 25, 2023
2 parents 04cfebd + ee5c5a1 commit 51b8acf
Show file tree
Hide file tree
Showing 4 changed files with 136 additions and 25 deletions.
3 changes: 3 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
model-gallery
model-gallery.exe
_test.yaml
33 changes: 33 additions & 0 deletions llama2-chat.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
name: "llama2-13b-chat"

description: |
Llama 2 13B Chat -> Llama 2 is a collection of pretrained and fine-tuned generative text models ranging in scale from 7 billion to 70 billion parameters.

license: "https://ai.meta.com/llama/license/"
urls:
- https://ai.meta.com/llama/

config_file: |
name: llama2-13b-chat
backend: "llama"
parameters:
top_k: 80
temperature: 0.2
top_p: 0.7
context_size: 4096
template:
chat_message: llama2-chat-message
system_prompt: |
You are a helpful, respectful and honest assistant. Always answer as helpfully as possible, while being safe. Your answers should not include any harmful, unethical, racist, sexist, toxic, dangerous, or illegal content. Please ensure that your responses are socially unbiased and positive in nature.
If a question does not make any sense, or is not factually coherent, explain why instead of answering something not correct. If you don't know the answer to a question, please don't share false information.
prompt_templates:
- name: "llama2-chat-message"
content: |
{{if eq .RoleName "assistant"}}{{.Content}}{{else}}
[INST]
{{if .SystemPrompt}}{{.SystemPrompt}}{{else if eq .RoleName "system"}}<<SYS>>{{.Content}}<</SYS>>
{{else if .Content}}{{.Content}}{{end}}
[/INST]
{{end}}
116 changes: 91 additions & 25 deletions main.go
Original file line number Diff line number Diff line change
Expand Up @@ -23,18 +23,73 @@ const indexFile = "huggingface.yaml"
var baseGalleryURL string = "github:go-skynet/model-gallery"
var baseConfig string = baseGalleryURL + "/base.yaml"

var baseURLs map[string]string = map[string]string{
// This maps the key to a file into the repository
"koala": "koala",
"manticore": "manticore",
"vicuna": "vicuna",
"airoboros": "airoboros",
"hypermantis": "hypermantis",
"guanaco": "guanaco",
"openllama": "openllama_3b",
"rwkv": "rwkv-raven-1b",
"wizard": "wizard",
"hippogriff": "hippogriff",
func StripErrorFromPointer[T any](value *T, errs ...error) *T {
if len(errs) > 0 && errs[0] != nil {
return nil
}
return value
}

// BaseDefinition describes one candidate base config in the model gallery.
type BaseDefinition struct {
	Name string // substring checked against the lowercased model ID / filename when Match is nil
	Path string // repository path (without the .yaml suffix) of the base config file
	Match *regexp.Regexp // optional explicit matcher; when set, it is preferred over the Name substring check
}

// baseDefinitions maps known model families to the gallery base-config
// file (Path, without the .yaml suffix) used for models of that family.
//
// Entries are matched top to bottom, with a break statement on first hit.
// What that means is if a model is named something like
// "LLama-Koala-Manticore-Wizard", whichever of those currently appears
// first in this list will "win".
// TODO: do we need a more sophisticated model than this?
// TODO: is the current list order even correct?
var baseDefinitions []BaseDefinition = []BaseDefinition{
	{
		Name: "koala",
		Path: "koala",
	},
	{
		Name: "manticore",
		Path: "manticore",
	},
	{
		Name: "vicuna",
		Path: "vicuna",
	},
	{
		Name: "airoboros",
		Path: "airoboros",
	},
	{
		Name: "hypermantis",
		Path: "hypermantis",
	},
	{
		Name: "guanaco",
		Path: "guanaco",
	},
	{
		Name: "openllama",
		Path: "openllama_3b",
	},
	{
		Name: "rwkv",
		Path: "rwkv-raven-1b",
	},
	{
		Name: "wizard",
		Path: "wizard",
	},
	{
		Name: "hippogriff",
		Path: "hippogriff",
	},
	{
		Name: "llama2-chat",
		Path: "llama2-chat",
		// MustCompile fails fast at package init if the pattern is invalid,
		// instead of silently producing a nil Match (which would make this
		// entry fall back to the "llama2-chat" substring check).
		Match: regexp.MustCompile(`llama-*2-*([\d]+b)?-*chat`),
	},
}

type Model struct {
Expand Down Expand Up @@ -80,13 +135,13 @@ func getSHA256(url string) (string, error) {

resp, err := http.Get(url)
if err != nil {
return "", fmt.Errorf("Failed to fetch the web page: %v\n", err)
return "", fmt.Errorf("failed to fetch the web page: %v\n", err)
}
defer resp.Body.Close()

htmlData, err := ioutil.ReadAll(resp.Body)
if err != nil {
return "", fmt.Errorf("Failed to read the response body: %v\n", err)
return "", fmt.Errorf("failed to read the response body: %v\n", err)
}

shaRegex := regexp.MustCompile(`(?s)<strong>SHA256:</strong>\s+(.+?)</li>`)
Expand Down Expand Up @@ -190,12 +245,20 @@ func scraperWorker(wg *sync.WaitGroup, c chan string, g chan GalleryModel) {
for _, m := range mm.Files {
url := baseConfig

for k, v := range baseURLs {
// Check if the model name or ID contains the key
// TODO: This is a bit hacky, we should probably use a regex(?)
if strings.Contains(strings.ToLower(m.Filename), k) || strings.Contains(strings.ToLower(model), k) {
url = fmt.Sprintf("%s/%s.yaml", baseGalleryURL, v)
break
for _, v := range baseDefinitions {
// Check if the model name or filename matches this baseDefinition
if v.Match != nil {
// If an explicit Match regex exists, prefer that.
if v.Match.MatchString((strings.ToLower(m.Filename))) || v.Match.MatchString((strings.ToLower(model))) { // TODO Do we need anything fancier than a boolean match? Might be interesting to capture group the # of parameters and feed that into a template somehow...
url = fmt.Sprintf("%s/%s.yaml", baseGalleryURL, v.Path)
break
}
} else {
// Otherwise, fallback on the existing string match
if strings.Contains(strings.ToLower(m.Filename), v.Name) || strings.Contains(strings.ToLower(model), v.Name) {
url = fmt.Sprintf("%s/%s.yaml", baseGalleryURL, v.Path)
break
}
}
}

Expand All @@ -218,7 +281,7 @@ func scraperWorker(wg *sync.WaitGroup, c chan string, g chan GalleryModel) {
}
}

func scrapeHuggingFace(term string, concurrency int) {
func scrapeHuggingFace(term string, concurrency int, indexFile string) {
// Step 1: Get a list of all models
resp, err := http.Get(fmt.Sprintf("https://huggingface.co/api/models?search=%s", term))
if err != nil {
Expand Down Expand Up @@ -281,15 +344,18 @@ func scrapeHuggingFace(term string, concurrency int) {

}

// parallelSearch runs the Hugging Face scraper once per search term,
// writing the aggregated results to indexFile with the given worker count.
func parallelSearch(terms []string, concurrency int, indexFile string) {
	for i := range terms {
		scrapeHuggingFace(terms[i], concurrency, indexFile)
	}
}

func main() {
concurrency := 10
c := os.Getenv("CONCURRENCY")
parallelism, err := strconv.Atoi(c)
if err == nil {
concurrency = parallelism
}

for _, term := range []string{"TheBloke", "ggml"} {
scrapeHuggingFace(term, concurrency)
}
parallelSearch([]string{"TheBloke", "ggml"}, concurrency, indexFile)
}
9 changes: 9 additions & 0 deletions main_test.go
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
package main

import (
"testing"
)

// TestSmallSearch runs the scraper end-to-end for a single search term with
// one worker, writing output to _test.yaml (gitignored).
// NOTE(review): this hits the live Hugging Face API, so it requires network
// access and can be slow/flaky offline — consider guarding with testing.Short().
func TestSmallSearch(t *testing.T) {
	parallelSearch([]string{"Llama-2-13B-chat-GGML"}, 1, "_test.yaml")
}

0 comments on commit 51b8acf

Please sign in to comment.