更新 mini支持讯飞中英文识别大模型,sant增加image对图像处理

This commit is contained in:
dahanzimin
2025-10-27 10:32:44 +08:00
parent f9d3427b20
commit d98b9fb0ed
4 changed files with 465 additions and 425 deletions

View File

@@ -45,7 +45,6 @@ class ASR_WebSocket(Ws_Param):
"domain": "iat",
"language": "zh_cn",
"accent": "mandarin",
"vinfo": 1,
"vad_eos": 1000,
"nbest": 1,
"wbest": 1,
@@ -56,7 +55,10 @@ class ASR_WebSocket(Ws_Param):
self.ws.settimeout(1000)
def _frame(self, status, buf):
return {"status": status, "format": "audio/L16;rate=8000", "audio": str(b64encode(buf), 'utf-8'), "encoding": "raw"}
if status == 0:
return {"common": {"app_id": self.APPID}, "business": self.business, "data": {"status": status, "format": "audio/L16;rate=8000", "audio": str(b64encode(buf), 'utf-8'), "encoding": "raw"}}
else:
return {"data": {"status": status, "format": "audio/L16;rate=8000", "audio": str(b64encode(buf), 'utf-8'), "encoding": "raw"}}
def on_message(self, message):
result = ""
@@ -98,17 +100,16 @@ class ASR_WebSocket(Ws_Param):
if pace: print('=',end ="")
# First-frame handling
if _state == 0:
d = {"common": {"app_id": self.APPID}, "business": self.business, "data": self._frame(_state, buf)}
d = self._frame(_state, buf)
_state = 1
# Middle-frame handling
else:
d = {"data": self._frame(_state, buf)}
d = self._frame(_state, buf)
self.ws.send(json.dumps(d))
#print("------",len(buf), time.ticks_diff(time.ticks_ms(), _star))
if time.ticks_diff(time.ticks_ms(), _star) > timeout:
raise OSError("Timeout pcm read error")
# Final-frame handling
d = {"data": self._frame(2, b'\x00')}
d = self._frame(2, b'\x00')
self.ws.send(json.dumps(d))
onboard_bot.pcm_en(False) #PCM关闭
if pace: print(']')
@@ -122,6 +123,45 @@ class ASR_WebSocket(Ws_Param):
else:
print("Run error: %s" % (e))
# Chinese-English speech recognition large model (iFlytek IAT)
class IAT_WebSocket(ASR_WebSocket):
    """iFlytek Chinese/English speech-recognition large-model (IAT v1) client.

    Reuses the ASR_WebSocket transport and frame-pumping loop, but speaks the
    v1 ``header``/``parameter``/``payload`` frame layout and decodes the
    base64-wrapped result text of the large-model endpoint.
    """

    def __init__(self, APPID, APIKey, APISecret, url='ws://iat.xf-yun.com/v1', accent="mandarin", res_id=None):
        super().__init__(APPID, APIKey, APISecret, url)
        # Optional hot-word / personalization resource id; sent in every header.
        self.res_id = res_id
        # Recognition parameters; attached only to the opening frame.
        self.business = {
            "domain": "slm",
            "language": "zh_cn",
            "accent": accent,
            "result": {
                "encoding": "utf8",
                "compress": "raw",
                "format": "plain"
            }
        }

    def _frame(self, status, buf):
        """Build one upstream JSON frame for audio chunk *buf*.

        *status* is 0 for the first frame (carries the "parameter" section),
        1 for intermediate frames and 2 for the closing frame.
        """
        header = {"status": status, "app_id": self.APPID, "res_id": self.res_id}
        payload = {"audio": {"audio": str(b64encode(buf), 'utf-8'), "sample_rate": 8000, "encoding": "raw"}}
        if status == 0:
            return {"header": header, "parameter": {"iat": self.business}, "payload": payload}
        return {"header": header, "payload": payload}

    def on_message(self, message):
        """Parse one downstream message.

        Returns ``(text, keep_running)`` where *keep_running* is False once the
        server reports the final message (header status == 2). Raises
        AttributeError when the server returns a non-zero error code.
        """
        msg = json.loads(message)
        header = msg['header']
        code = header["code"]
        if code != 0:
            raise AttributeError("%s Code:%s" % (header["message"], code))
        pieces = []
        if "payload" in msg:
            # Result text is base64-encoded JSON holding a 'ws' word-segment list.
            decoded = json.loads(b64decode(msg["payload"]["result"]["text"]).decode())
            for segment in decoded['ws']:
                for candidate in segment["cw"]:
                    pieces.append(candidate["w"])
        return "".join(pieces), header["status"] != 2
# Large language model (LLM)
class LLM_WebSocket(Ws_Param):
Model_url = {

View File

@@ -5,18 +5,23 @@ MicroPython library for the Camera(Inherit C module)
=======================================================
@dahanzimin From the Mixly Team
"""
import time
import base64
import jpeg
from _camera import *
from jpeg import Encoder
from base64 import b64encode
from machine import SoftI2C, Pin
from mixgo_sant import onboard_bot
from jpeg import Encoder, Decoder
class IMG:
    """Lightweight container for a raw framebuffer image.

    Bundles the pixel buffer with the metadata (size, pixel format) that the
    JPEG encoder/decoder and the TFT driver need to interpret it.
    """

    def __init__(self, image, width, height, pixel_format="RGB565"):
        """
        :param image: raw pixel buffer (bytes / bytearray / memoryview).
        :param width: image width in pixels.
        :param height: image height in pixels.
        :param pixel_format: pixel layout of the buffer. Defaults to
            "RGB565", the format the camera driver produces, so existing
            callers are unaffected.
        """
        self.image = image
        self.width = width
        self.height = height
        self.format = pixel_format

    def __repr__(self):
        # Helpful for interactive debugging on-device.
        return "IMG(%dx%d, %s, %d bytes)" % (self.width, self.height, self.format, len(self.image))
class Camera(Camera):
def __init__(self, frame_size=FrameSize.R240X240, pixel_format=PixelFormat.RGB565, hmirror=False, vflip=False, **kwargs):
from mixgo_sant import onboard_bot
onboard_bot.cam_reset(1, 0)
onboard_bot.cam_en(1, 150)
super().__init__(frame_size=frame_size, pixel_format=pixel_format, **kwargs)
self.set_hmirror(not hmirror)
@@ -27,21 +32,42 @@ class Camera(Camera):
def deinit(self):
super().deinit()
onboard_bot.cam_reset(0, 0)
onboard_bot.cam_en(0, 100)
def snapshot(self, path=None, formats=0, quality=90, rotation=0):
if formats == 0 and path is None:
def snapshot(self, path=None, quality=90, rotation=0):
if path is None:
return self.capture()
else:
_encoder = Encoder(pixel_format="RGB565_BE", quality=quality, rotation=rotation, width=self.get_pixel_width(), height=self.get_pixel_height())
_jpeg = _encoder.encode(self.capture())
del _encoder
if path is None:
if formats == 1:
return _jpeg
else:
return b'data:image/jpg;base64,' + base64.b64encode(_jpeg)
else:
with open(path, 'wb') as f:
f.write(_jpeg)
return True
Image.save(self.capture(), path, quality, rotation)
def capture(self):
    # Wrap the raw framebuffer returned by the underlying C camera driver in
    # an IMG so downstream helpers (Image.save/convert, the TFT display) get
    # the width/height metadata they need.
    return IMG(super().capture(), self.get_pixel_width(), self.get_pixel_height())
class Image:
    """JPEG helpers for IMG framebuffers.

    Provides save-to-file, load-from-file and in-memory conversion
    (raw JPEG bytes or a base64 data-URI) for camera images.
    """

    def save(self, img, path="mixly.jpg", quality=90, rotation=0, **kwargs):
        """Encode *img* to JPEG. Writes to *path* when it is a string;
        otherwise returns the JPEG bytes."""
        encoder = Encoder(pixel_format="RGB565_BE", quality=quality, rotation=rotation,
                          width=img.width, height=img.height, **kwargs)
        jpeg_data = encoder.encode(img.image)
        del encoder  # release the encoder promptly on constrained RAM
        if not isinstance(path, str):
            return jpeg_data
        with open(path, 'wb') as f:
            f.write(jpeg_data)

    def open(self, path="mixly.jpg", rotation=0, **kwargs):
        """Decode the JPEG file at *path* into an IMG (RGB565_BE pixels)."""
        with open(path, "rb") as f:
            jpeg_data = f.read()
        decoder = Decoder(pixel_format="RGB565_BE", rotation=rotation, **kwargs)
        info = decoder.get_img_info(jpeg_data)
        picture = IMG(decoder.decode(jpeg_data), info[0], info[1])
        del decoder  # release the decoder promptly on constrained RAM
        return picture

    def convert(self, img, formats=0, **kwargs):
        """Return *img* as raw JPEG bytes (formats=0) or as a
        base64 data-URI (formats=1)."""
        if formats == 0:
            return self.save(img, None, **kwargs)
        if formats == 1:
            return b'data:image/jpg;base64,' + b64encode(self.save(img, None, **kwargs))

# Image-processing singleton: module users call Image.save/open/convert directly.
Image = Image()

View File

@@ -1,18 +1,16 @@
"""
mixgo_sant Onboard resources(v1.9)
mixgo_sant Onboard resources(v2.0)
Micropython library for the mixgo_sant Onboard resources
=======================================================
@dahanzimin From the Mixly Team
"""
import gc
import time
import math
from machine import *
from music import MIDI
from ws2812x import NeoPixel
from machine import *
import time
import gc
import st7789_cf
import math
'''RTC'''
rtc_clock = RTC()
@@ -33,6 +31,7 @@ except Exception as e:
print("Warning: Failed to communicate with BOT035 (Coprocessor) or", e)
'''TFT/240*240'''
import st7789_cf
onboard_tft = st7789_cf.ST7789(onboard_spi, 240, 240, dc_pin=45, reset=onboard_bot.tft_reset, backlight=onboard_bot.tft_brightness, font_address=0xF00000)
'''ACC-Sensor'''
@@ -83,8 +82,6 @@ onboard_rgb = NeoPixel(onboard_bot.rgb_sync, 4)
onboard_music = MIDI(46, pa_ctrl=onboard_bot.spk_en)
'''5KEY_Sensor'''
class KEYSensor:
def __init__(self, pin, range):
self.pin = pin
@@ -122,10 +119,7 @@ class KEYSensor:
def irq(self, handler, trigger):
Pin(self.pin, Pin.IN).irq(handler=handler, trigger=trigger)
'''1KEY_Button'''
class Button(KEYSensor):
def __init__(self, pin):
self.pin = pin
@@ -135,7 +129,6 @@ class Button(KEYSensor):
def _value(self):
return not self.key.value()
B1key = Button(0)
B2key = KEYSensor(17, 0)
A1key = KEYSensor(17, 1600)
@@ -144,8 +137,6 @@ A3key = KEYSensor(17, 550)
A4key = KEYSensor(17, 2100)
'''2-LED'''
class LED:
def __init__(self, func):
self._func = func
@@ -168,10 +159,8 @@ class LED:
def getonoff(self, index):
return True if self.getbrightness(index) > 50 else False
onboard_led = LED(onboard_bot.led_pwm)
class Voice_Energy:
def read(self, samples=10):
values = []
@@ -180,10 +169,8 @@ class Voice_Energy:
0x08, 3)[:2], 'little')) # 在语音识别里获取
return sorted(values)[samples // 2]
onboard_sound = Voice_Energy()
class Clock:
def __init__(self, x, y, radius, color, oled=onboard_tft): # 定义时钟中心点和半径
self.display = oled
@@ -254,6 +241,5 @@ class Clock:
def clear(self, color=0): # 清除
self.display.ellipse(self.xc, self.yc, self.r, self.r, color, True)
'''Reclaim memory'''
gc.collect()

View File

@@ -8,24 +8,16 @@ MicroPython library for the ST7789(TFT-SPI)
import time
import uframebuf
from machine import Pin
from jpeg import Decoder
from camera import Image, IMG
from micropython import const
# ST7789 controller command opcodes (see the ST7789 datasheet command table).
_CMD_SWRESET = const(0x01)
_CMD_SLPIN = const(0x10)
_CMD_SLPOUT = const(0x11)
_CMD_PTLON = const(0x12)
_CMD_NORON = const(0x13)
_CMD_INVOFF = const(0x20)
_CMD_INVON = const(0x21)
_CMD_DISPOFF = const(0x28)
_CMD_DISPON = const(0x29)
_CMD_CASET = const(0x2A)
_CMD_RASET = const(0x2B)
_CMD_RAMWR = const(0x2C)
_CMD_RAMRD = const(0x2E)
_CMD_PTLAR = const(0x30)
_CMD_VSCRDEF = const(0x33)
_CMD_COLMOD = const(0x3A)
_CMD_MADCTL = const(0x36)
@@ -44,16 +36,12 @@ class ST7789(uframebuf.FrameBuffer_Uincode):
def display(self, data=None, rotation=0, sync=True):
if type(data) is str:
with open(data, "rb") as f:
_jpeg = f.read()
_decoder = Decoder(pixel_format="RGB565_BE", rotation=rotation)
self._buffer[:] = _decoder.decode(_jpeg)
del _decoder
else:
self._buffer[:] = data # 后期做图像大小处理
if sync:
self.show()
return self._buffer
data = Image.open(data, rotation)
self._buffer[:] = data.image # 后期做图像尺寸匹配处理
if sync: self.show()
def screenshot(self):
    # Expose the current display buffer as an IMG. memoryview avoids a copy,
    # so the returned image aliases the live framebuffer and reflects later
    # draws until the caller copies it (e.g. via Image.save).
    return IMG(memoryview(self._buffer), self.width, self.height)
def _write(self, cmd, dat=None):
self.dc.off()