/* blob.c - Alpine Package Keeper (APK) * * Copyright (C) 2005-2008 Natanael Copa * Copyright (C) 2008-2011 Timo Teräs * All rights reserved. * * This program is free software; you can redistribute it and/or modify it * under the terms of the GNU General Public License version 2 as published * by the Free Software Foundation. See http://www.gnu.org/ for details. */ #include #include #include #include "apk_blob.h" #include "apk_hash.h" struct apk_blob_atom { struct hlist_node hash_node; apk_blob_t blob; }; char *apk_blob_cstr(apk_blob_t blob) { char *cstr; if (blob.len == 0) return strdup(""); if (blob.ptr[blob.len-1] == 0) return strdup(blob.ptr); cstr = malloc(blob.len + 1); memcpy(cstr, blob.ptr, blob.len); cstr[blob.len] = 0; return cstr; } #if defined(__i386__) static unsigned long inline memspn( const unsigned char *ptr, unsigned long len, const unsigned char *array) { unsigned long p = len; __asm__("cld ; xorl %%eax, %%eax\n" "1:\n" "lodsb\n" "btl %%eax, %2\n" "jnc 2f\n" "decl %1\n" "jnz 1b\n" "2:\n" : "+&S" (ptr), "+&r" (p) : "m" (*array) : "cc", "%eax"); return p; } static unsigned long inline memcspn( const unsigned char *ptr, unsigned long len, const unsigned char *array) { unsigned long p = len; __asm__("cld ; xorl %%eax, %%eax\n" "1:\n" "lodsb\n" "btl %%eax, %2\n" "jc 2f\n" "decl %1\n" "jnz 1b\n" "2:\n" : "+&S" (ptr), "+&r" (p) : "m" (*array) : "cc", "%eax"); return p; } int apk_blob_spn(apk_blob_t blob, const apk_spn_match accept, apk_blob_t *l, apk_blob_t *r) { unsigned int i; if (blob.len == 0) return 0; i = blob.len - memspn((unsigned char*) blob.ptr, blob.len, accept); if (i == blob.len) return 0; if (l != NULL) *l = APK_BLOB_PTR_LEN(blob.ptr, i); if (r != NULL) *r = APK_BLOB_PTR_LEN(blob.ptr+i, blob.len-i); return 1; } int apk_blob_cspn(apk_blob_t blob, const apk_spn_match reject, apk_blob_t *l, apk_blob_t *r) { unsigned int i; if (blob.len == 0) return 0; i = blob.len - memcspn((unsigned char*) blob.ptr, blob.len, reject); if (i == blob.len) return 0; if (l != NULL) *l = APK_BLOB_PTR_LEN(blob.ptr, i); if (r != NULL) *r = APK_BLOB_PTR_LEN(blob.ptr+i, blob.len-i); return 1; } #else static int inline test_bit(const unsigned char *array, unsigned bit) { return array[bit >> 3] & (1 << (bit & 7)); } int apk_blob_spn(apk_blob_t blob, const apk_spn_match accept, apk_blob_t *l, apk_blob_t *r) { int i; for (i = 0; i < blob.len; i++) { if (!test_bit(accept, blob.ptr[i])) { if (l != NULL) *l = APK_BLOB_PTR_LEN(blob.ptr, i); if (r != NULL) *r = APK_BLOB_PTR_LEN(blob.ptr+i, blob.len-i); return 1; } } return 0; } int apk_blob_cspn(apk_blob_t blob, const apk_spn_match reject, apk_blob_t *l, apk_blob_t *r) { int i; for (i = 0; i < blob.len; i++) { if (test_bit(reject, blob.ptr[i])) { if (l != NULL) *l = APK_BLOB_PTR_LEN(blob.ptr, i); if (r != NULL) *r = APK_BLOB_PTR_LEN(blob.ptr+i, blob.len-i); return 1; } } return 0; } #endif int apk_blob_rsplit(apk_blob_t blob, char split, apk_blob_t *l, apk_blob_t *r) { char *sep; sep = memrchr(blob.ptr, split, blob.len); if (sep == NULL) return 0; if (l != NULL) *l = APK_BLOB_PTR_PTR(blob.ptr, sep - 1); if (r != NULL) *r = APK_BLOB_PTR_PTR(sep + 1, blob.ptr + blob.len - 1); return 1; } int apk_blob_split(apk_blob_t blob, apk_blob_t split, apk_blob_t *l, apk_blob_t *r) { char *pos = blob.ptr, *end = blob.ptr + blob.len - split.len + 1; if (end < pos) return 0; while (1) { pos = memchr(pos, split.ptr[0], end - pos); if (pos == NULL) return 0; if (split.len > 1 && memcmp(pos, split.ptr, split.len) != 0) { pos++; continue; } *l = APK_BLOB_PTR_PTR(blob.ptr, pos-1); *r = APK_BLOB_PTR_PTR(pos+split.len, blob.ptr+blob.len-1); return 1; } } apk_blob_t apk_blob_pushed(apk_blob_t buffer, apk_blob_t left) { if (buffer.ptr + buffer.len != left.ptr + left.len) return APK_BLOB_NULL; return APK_BLOB_PTR_LEN(buffer.ptr, left.ptr - buffer.ptr); } static uint32_t murmur3_32(const char *key, uint32_t len, uint32_t seed) { static const uint32_t c1 = 0xcc9e2d51; static const uint32_t c2 = 0x1b873593; static const uint32_t r1 = 15; static const uint32_t r2 = 13; static const uint32_t m = 5; static const uint32_t n = 0xe6546b64; uint32_t hash = seed; const int nblocks = len / 4; const uint32_t *blocks = (const uint32_t *) key; int i; for (i = 0; i < nblocks; i++) { uint32_t k = blocks[i]; k *= c1; k = (k << r1) | (k >> (32 - r1)); k *= c2; hash ^= k; hash = ((hash << r2) | (hash >> (32 - r2))) * m + n; } const uint8_t *tail = (const uint8_t *) (key + nblocks * 4); uint32_t k1 = 0; switch (len & 3) { case 3: k1 ^= tail[2] << 16; case 2: k1 ^= tail[1] << 8; case 1: k1 ^= tail[0]; k1 *= c1; k1 = (k1 << r1) | (k1 >> (32 - r1)); k1 *= c2; hash ^= k1; } hash ^= len; hash ^= (hash >> 16); hash *= 0x85ebca6b; hash ^= (hash >> 13); hash *= 0xc2b2ae35; hash ^= (hash >> 16); return hash; } unsigned long apk_blob_hash_seed(apk_blob_t blob, unsigned long seed) { return murmur3_32(blob.ptr, blob.len, seed); } unsigned long apk_blob_hash(apk_blob_t blob) { return apk_blob_hash_seed(blob, 5381); } int apk_blob_compare(apk_blob_t a, apk_blob_t b) { if (a.len == b.len) return memcmp(a.ptr, b.ptr, a.len); if (a.len < b.len) return -1; return 1; } int apk_blob_ends_with(apk_blob_t a, apk_blob_t b) { if (a.len < b.len) return 0; return memcmp(a.ptr+a.len-b.len, b.ptr, b.len) == 0; } int apk_blob_for_each_segment(apk_blob_t blob, const char *split, int (*cb)(void *ctx, apk_blob_t blob), void *ctx) { apk_blob_t l, r, s = APK_BLOB_STR(split); int rc; r = blob; while (apk_blob_split(r, s, &l, &r)) { rc = cb(ctx, l); if (rc != 0) return rc; } if (r.len > 0) return cb(ctx, r); return 0; } static unsigned char digitdecode[] = { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0x3e, 0xff, 0xff, 0xff, 0xff, 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 0xff, 0xff, 0xff, 0x00, 0xff, 0xff, 0xff, 0xa, 0xb, 0xc, 0xd, 0xe, 0xf, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xa, 0xb, 0xc, 0xd, 0xe, 0xf, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, }; static inline int dx(unsigned char c) { return digitdecode[c]; } void apk_blob_push_blob(apk_blob_t *to, apk_blob_t literal) { if (unlikely(APK_BLOB_IS_NULL(*to))) return; if (unlikely(to->len < literal.len)) { *to = APK_BLOB_NULL; return; } memcpy(to->ptr, literal.ptr, literal.len); to->ptr += literal.len; to->len -= literal.len; } static const char *xd = "0123456789abcdefghijklmnopqrstuvwxyz"; void apk_blob_push_uint(apk_blob_t *to, unsigned int value, int radix) { char buf[64]; char *ptr = &buf[sizeof(buf)-1]; if (value == 0) { apk_blob_push_blob(to, APK_BLOB_STR("0")); return; } while (value != 0) { *(ptr--) = xd[value % radix]; value /= radix; } apk_blob_push_blob(to, APK_BLOB_PTR_PTR(ptr+1, &buf[sizeof(buf)-1])); } void apk_blob_push_csum(apk_blob_t *to, struct apk_checksum *csum) { switch (csum->type) { case APK_CHECKSUM_MD5: apk_blob_push_hexdump(to, APK_BLOB_CSUM(*csum)); break; case APK_CHECKSUM_SHA1: apk_blob_push_blob(to, APK_BLOB_STR("Q1")); apk_blob_push_base64(to, APK_BLOB_CSUM(*csum)); break; default: *to = APK_BLOB_NULL; break; } } void apk_blob_push_hexdump(apk_blob_t *to, apk_blob_t binary) { char *d; int i; if (unlikely(APK_BLOB_IS_NULL(*to))) return; if (unlikely(to->len < binary.len * 2)) { *to = APK_BLOB_NULL; return; } for (i = 0, d = to->ptr; i < binary.len; i++) { *(d++) = xd[(binary.ptr[i] >> 4) & 0xf]; *(d++) = xd[binary.ptr[i] & 0xf]; } to->ptr = d; to->len -= binary.len * 2; } static const char b64encode[] = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/"; static inline void push_b64_chunk(unsigned char *to, const unsigned char *from, int len) { to[0] = b64encode[from[0] >> 2]; to[1] = b64encode[((from[0] & 0x03) << 4) | ((from[1] & 0xf0) >> 4)]; to[2] = len < 2 ? '=' : b64encode[((from[1] & 0x0f) << 2) | ((from[2] & 0xc0) >> 6)]; to[3] = len < 3 ? '=' : b64encode[from[2] & 0x3f ]; } void apk_blob_push_base64(apk_blob_t *to, apk_blob_t binary) { unsigned char *src = (unsigned char *) binary.ptr; unsigned char *dst = (unsigned char *) to->ptr; int i, needed; if (unlikely(APK_BLOB_IS_NULL(*to))) return; needed = ((binary.len + 2) / 3) * 4; if (unlikely(to->len < needed)) { *to = APK_BLOB_NULL; return; } for (i = 0; i < binary.len / 3; i++, src += 3, dst += 4) push_b64_chunk(dst, src, 4); i = binary.len % 3; if (i != 0) push_b64_chunk(dst, src, i); to->ptr += needed; to->len -= needed; } void apk_blob_pull_char(apk_blob_t *b, int expected) { if (unlikely(APK_BLOB_IS_NULL(*b))) return; if (unlikely(b->len < 1 || b->ptr[0] != expected)) { *b = APK_BLOB_NULL; return; } b->ptr ++; b->len --; } unsigned int apk_blob_pull_uint(apk_blob_t *b, int radix) { unsigned int val; int ch; val = 0; while (b->len && b->ptr[0] != 0) { ch = dx(b->ptr[0]); if (ch >= radix) break; val *= radix; val += ch; b->ptr++; b->len--; } return val; } void apk_blob_pull_csum(apk_blob_t *b, struct apk_checksum *csum) { int encoding; if (unlikely(APK_BLOB_IS_NULL(*b))) return; if (unlikely(b->len < 2)) { *b = APK_BLOB_NULL; return; } if (dx(b->ptr[0]) != 0xff) { /* Assume MD5 for backwards compatibility */ csum->type = APK_CHECKSUM_MD5; apk_blob_pull_hexdump(b, APK_BLOB_CSUM(*csum)); return; } encoding = b->ptr[0]; switch (b->ptr[1]) { case '1': csum->type = APK_CHECKSUM_SHA1; break; default: *b = APK_BLOB_NULL; return; } b->ptr += 2; b->len -= 2; switch (encoding) { case 'X': apk_blob_pull_hexdump(b, APK_BLOB_CSUM(*csum)); break; case 'Q': apk_blob_pull_base64(b, APK_BLOB_CSUM(*csum)); break; default: *b = APK_BLOB_NULL; break; } } void apk_blob_pull_hexdump(apk_blob_t *b, apk_blob_t to) { char *s, *d; int i, r, r1, r2; if (unlikely(APK_BLOB_IS_NULL(*b))) return; if (unlikely(to.len > b->len * 2)) goto err; r = 0; for (i = 0, s = b->ptr, d = to.ptr; i < to.len; i++) { r |= r1 = dx(*(s++)); r |= r2 = dx(*(s++)); *(d++) = (r1 << 4) + r2; } if (unlikely(r == 0xff)) goto err; b->ptr = s; b->len -= to.len * 2; return; err: *b = APK_BLOB_NULL; } int apk_blob_pull_blob_match(apk_blob_t *b, apk_blob_t match) { if (b->len < match.len) return 0; if (memcmp(b->ptr, match.ptr, match.len) != 0) return 0; b->ptr += match.len; b->len -= match.len; return 1; } static unsigned char b64decode[] = { 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0x3e, 0xff, 0xff, 0xff, 0x3f, 0x34, 0x35, 0x36, 0x37, 0x38, 0x39, 0x3a, 0x3b, 0x3c, 0x3d, 0xff, 0xff, 0xff, 0x00, 0xff, 0xff, 0xff, 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f, 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17, 0x18, 0x19, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f, 0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x26, 0x27, 0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2d, 0x2e, 0x2f, 0x30, 0x31, 0x32, 0x33, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, 0xff, }; static inline __attribute__((always_inline)) int pull_b64_chunk(unsigned char *restrict to, const unsigned char *restrict from, int len) { unsigned char tmp[4]; int i, r = 0; for (i = 0; i < 4; i++) { tmp[i] = b64decode[from[i]]; r |= tmp[i]; } if (unlikely(r == 0xff)) return -1; to[0] = (tmp[0] << 2 | tmp[1] >> 4); if (len > 1) to[1] = (tmp[1] << 4 | tmp[2] >> 2); else if (unlikely(from[2] != '=')) return -1; if (len > 2) to[2] = (((tmp[2] << 6) & 0xc0) | tmp[3]); else if (unlikely(from[3] != '=')) return -1; return 0; } void apk_blob_pull_base64(apk_blob_t *b, apk_blob_t to) { unsigned char tmp[4]; unsigned char *restrict src = (unsigned char *) b->ptr; unsigned char *restrict dst = (unsigned char *) to.ptr; unsigned char *dend; int r, needed; if (unlikely(APK_BLOB_IS_NULL(*b))) return; needed = ((to.len + 2) / 3) * 4; if (unlikely(b->len < needed)) goto err; r = 0; dend = dst + to.len - 2; for (; dst < dend; src += 4, dst += 3) { r |= tmp[0] = b64decode[src[0]]; r |= tmp[1] = b64decode[src[1]]; r |= tmp[2] = b64decode[src[2]]; r |= tmp[3] = b64decode[src[3]]; dst[0] = (tmp[0] << 2 | tmp[1] >> 4); dst[1] = (tmp[1] << 4 | tmp[2] >> 2); dst[2] = (((tmp[2] << 6) & 0xc0) | tmp[3]); } if (unlikely(r == 0xff)) goto err; dend += 2; if (dst != dend && pull_b64_chunk(dst, src, dend - dst) != 0) goto err; b->ptr += needed; b->len -= needed; return; err: *b = APK_BLOB_NULL; } static apk_blob_t atom_hash_get_key(apk_hash_item item) { return ((struct apk_blob_atom *) item)->blob; } static struct apk_hash atom_hash; static struct apk_hash_ops atom_ops = { .node_offset = offsetof(struct apk_blob_atom, hash_node), .get_key = atom_hash_get_key, .hash_key = apk_blob_hash, .compare = apk_blob_compare, .delete_item = (apk_hash_delete_f) free, }; apk_blob_t apk_null_blob = {0,0}; #ifdef VALGRIND static void apk_atom_fini(void) { apk_hash_free(&atom_hash); } #endif void apk_atom_init(void) { #ifdef VALGRIND atexit(apk_atom_fini); #endif apk_hash_init(&atom_hash, &atom_ops, 10000); } apk_blob_t *apk_blob_atomize(apk_blob_t blob) { struct apk_blob_atom *atom; unsigned long hash = apk_hash_from_key(&atom_hash, blob); if (blob.len < 0 || blob.ptr == NULL) return &apk_null_blob; atom = (struct apk_blob_atom *) apk_hash_get_hashed(&atom_hash, blob, hash); if (atom != NULL) return &atom->blob; atom = malloc(sizeof(*atom)); atom->blob = blob; apk_hash_insert_hashed(&atom_hash, atom, hash); return &atom->blob; } apk_blob_t *apk_blob_atomize_dup(apk_blob_t blob) { struct apk_blob_atom *atom; unsigned long hash = apk_hash_from_key(&atom_hash, blob); char *ptr; if (blob.len < 0 || blob.ptr == NULL) return &apk_null_blob; atom = (struct apk_blob_atom *) apk_hash_get_hashed(&atom_hash, blob, hash); if (atom != NULL) return &atom->blob; atom = malloc(sizeof(*atom) + blob.len); ptr = (char*) (atom + 1); memcpy(ptr, blob.ptr, blob.len); atom->blob = APK_BLOB_PTR_LEN(ptr, blob.len); apk_hash_insert_hashed(&atom_hash, atom, hash); return &atom->blob; }