src/server/internal/inference/voice_llm_client_test.go

961 bytes · 34 lines · capsule://quake0day/[email protected] raw on github

package inference

import "testing"

func TestVoiceLLMInputPBMapsImageFrame(t *testing.T) {
	req := voiceLLMInputPB(VoiceLLMInputEvent{
		Image: &ImageFrame{
			Data:        []byte{0xff, 0xd8, 0xff, 0x00},
			MimeType:    "image/jpeg",
			Width:       640,
			Height:      360,
			Source:      "screen",
			TimestampMS: 123,
			FrameSeq:    7,
		},
	})
	if req == nil {
		t.Fatal("expected request")
	}
	image := req.GetImage()
	if image == nil {
		t.Fatalf("expected image input, got %T", req.GetInput())
	}
	if string(image.GetData()) != string([]byte{0xff, 0xd8, 0xff, 0x00}) {
		t.Fatalf("unexpected image data: %v", image.GetData())
	}
	if image.GetMimeType() != "image/jpeg" || image.GetWidth() != 640 || image.GetHeight() != 360 {
		t.Fatalf("unexpected image metadata: %+v", image)
	}
	if image.GetSource() != "screen" || image.GetTimestampMs() != 123 || image.GetFrameSeq() != 7 {
		t.Fatalf("unexpected image source/timing metadata: %+v", image)
	}
}