emscripten/tests/benchmark_utf16.cpp

68 строки
2.1 KiB
C++

// Copyright 2016 The Emscripten Authors. All rights reserved.
// Emscripten is available under two separate licenses, the MIT license and the
// University of Illinois/NCSA Open Source License. Both these licenses can be
// found in the LICENSE file.
#include <stdio.h>
#include <string.h>
#include <wchar.h>
#include <iostream>
#include <cassert>
#include <emscripten.h>
double test(const unsigned short *str) {
double res = EM_ASM_DOUBLE({
var t0 = _emscripten_get_now();
var str = Module.UTF16ToString($0);
var t1 = _emscripten_get_now();
out('t: ' + (t1 - t0) + ', len(result): ' + str.length + ', result: ' + str.slice(0, 100));
return (t1-t0);
}, str);
return res;
}
unsigned short *utf16_corpus = 0;
long utf16_corpus_length = 0;
unsigned short *randomString(int len) {
if (!utf16_corpus) {
// FILE *handle = fopen("ascii_corpus.txt", "rb");
FILE *handle = fopen("utf16_corpus.txt", "rb");
fseek(handle, 0, SEEK_END);
utf16_corpus_length = ftell(handle)/2;
assert(utf16_corpus_length > 0);
utf16_corpus = new unsigned short[utf16_corpus_length+1];
fseek(handle, 0, SEEK_SET);
fread(utf16_corpus, 2, utf16_corpus_length, handle);
fclose(handle);
utf16_corpus[utf16_corpus_length] = 0;
}
int startIdx = rand() % (utf16_corpus_length - len);
while((utf16_corpus[startIdx] & 0xFF00) == 0xDC00) {
++startIdx;
if (startIdx + len > utf16_corpus_length) len = utf16_corpus_length - startIdx;
}
assert(len > 0);
unsigned short *s = new unsigned short[len+1];
memcpy(s, utf16_corpus + startIdx, len*2);
s[len] = 0;
while(((unsigned short)s[len-1] & 0xFF00) == 0xD800) { s[--len] = 0; }
assert(len >= 0);
return s;
}
int main() {
srand(time(NULL));
double t = 0;
double t2 = emscripten_get_now();
for(int i = 0; i < 10; ++i) {
// FF Nightly: Already on small strings of 64 bytes in length, TextDecoder trumps in performance.
unsigned short *str = randomString(100);
t += test(str);
delete [] str;
}
double t3 = emscripten_get_now();
printf("OK. Time: %f (%f).\n", t, t3-t2);
return 0;
}