Added support for multiline ID3v2 frames

author: Alexey Yakovenko <wakeroid@gmail.com> 2010-04-05 19:59:33 +0200
committer: Alexey Yakovenko <wakeroid@gmail.com> 2010-04-05 19:59:33 +0200
commit: fb8fc73d1012451a91df0e68435b30b68fb8020a (patch)
tree: a7f0210ba028a55ea169a0f0d384c9dc5001788c /junklib.c
parent: 4de59f6b45b6e71df9fda01ae9d1ed356d3eae98 (diff)
1 files changed, 44 insertions, 25 deletions
diff --git a/junklib.c b/junklib.c
index b781f7cf..ce7d0149 100644
--- a/junklib.c
+++ b/junklib.c
@@ -314,21 +314,31 @@ can_be_russian (const signed char *str) {
 
 static char *
 convstr_id3v2 (int version, uint8_t encoding, const unsigned char* str, int sz) {
-    static char out[2048];
-    const char *enc = "iso8859-1";
+    char out[2048] = "";
+    const char *enc = NULL;
 
-    if (version == 4 && encoding == 3) {
-        // utf8
-        trace ("utf8\n");
-        strncpy (out, str, 2047);
-        out[min (sz, 2047)] = 0;
-        return strdup (out);
-    }
-    else if (version == 4 && encoding == 2) {
+    // detect encoding
+    if (version == 4 && encoding == 2) {
         trace ("utf16be\n");
         enc = "UTF-16BE";
     }
-    else if (encoding == 1) {
+    else if (version == 4 && encoding == 3) {
+        enc = UTF8;
+    }
+    else if (encoding == 0) {
+        // hack to add limited cp1251 recoding support
+        if (can_be_russian (str)) {
+            enc = "cp1251";
+        }
+    }
+    else if (encoding != 1 && !(version == 4 && encoding == 3)){
+        return NULL; // invalid encoding
+    }
+
+    if (encoding == 1) { // detect kind of unicode used
+        if (sz < 2) {
+            return NULL;
+        }
         if (version < 4) {
             if (str[0] == 0xff && str[1] == 0xfe) {
                 enc = "UCS-2LE";
@@ -350,32 +360,34 @@ convstr_id3v2 (int version, uint8_t encoding, const unsigned char* str, int sz)
             enc = "UTF-16";
         }
     }
-#if 0
-    // NOTE: some dumb taggers put non-iso8859-1 text with enc=0
-    else if (*str == 0) {
-        // iso8859-1
-        trace ("iso8859-1\n");
-        enc = "iso8859-1";
-    }
-#endif
     else if (encoding == 0) {
         // hack to add limited cp1251 recoding support
         if (can_be_russian (str)) {
             enc = "cp1251";
         }
+        else {
+            enc = "iso8859-1";
+        }
     }
-    else {
-        return 0; // invalid encoding
+
+    int converted_sz = 0;
+
+    if ((converted_sz = junk_iconv (str, sz, out, sizeof (out), enc, UTF8)) < 0) {
+        return NULL;
     }
-    if (junk_iconv (str, sz, out, sizeof (out), enc, UTF8) > 0) {
-        trace ("converted: %s\n", out);
-        return strdup (out);
+    else {
+        for (int n = 0; n < converted_sz; n++) {
+            if (out[n] == 0 && n != converted_sz-1) {
+                out[n] = '\n';
+            }
+        }
     }
-    return NULL;
+    return strdup (out);
 }
 
 static const char *
 convstr_id3v1 (const char* str, int sz) {
+    trace ("convstr_id3v1\n");
     static char out[2048];
     int i;
     for (i = 0; i < sz; i++) {
@@ -2441,7 +2453,14 @@ junk_id3v2_read_full (playItem_t *it, DB_id3v2_tag_t *tag_store, DB_FILE *fp) {
                         trace ("frame %s is too big, discard\n", frameid);
                         break;
                     }
+
                     char *text = convstr_id3v2 (version_major, readptr[0], readptr+1, synched_size-1);
+
+                    // couple of simple tests
+                    //char *text = convstr_id3v2 (4, 3, "текст1\0текст2", strlen ("текст1")*2+2);
+                    //const char ucstext[] = { 0x42, 0x04, 0x35, 0x04, 0x3a, 0x04, 0x41, 0x04, 0x42, 0x04, 0x31, 0x00, 0x00, 0x00, 0x42, 0x04, 0x35, 0x04, 0x3a, 0x04, 0x41, 0x04, 0x42, 0x04, 0x32, 0x00 };
+                    //char *text = convstr_id3v2 (4, 1, ucstext, sizeof (ucstext));
+
                     if (text && *text && text_holders[f]) {
                         if (*text_holders[f]) {
                             // append
author	Alexey Yakovenko <wakeroid@gmail.com>	2010-04-05 19:59:33 +0200
committer	Alexey Yakovenko <wakeroid@gmail.com>	2010-04-05 19:59:33 +0200
commit	fb8fc73d1012451a91df0e68435b30b68fb8020a (patch)
tree	a7f0210ba028a55ea169a0f0d384c9dc5001788c /junklib.c
parent	4de59f6b45b6e71df9fda01ae9d1ed356d3eae98 (diff)