|
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949 |
- // Copyright 2021 Tencent
- // SPDX-License-Identifier: BSD-3-Clause
-
- #include "mat.h"
-
- #include <ctype.h>
- #include <limits.h>
-
- #if __ARM_NEON
- #include <arm_neon.h>
- #endif // __ARM_NEON
-
- #if __SSE2__
- #include <emmintrin.h>
- #endif
-
- #include "platform.h"
-
- namespace ncnn {
-
- #if NCNN_PIXEL_DRAWING
-
- #include "mat_pixel_drawing_font.h"
-
- void draw_rectangle_c1(unsigned char* pixels, int w, int h, int rx, int ry, int rw, int rh, unsigned int color, int thickness)
- {
- return draw_rectangle_c1(pixels, w, h, w, rx, ry, rw, rh, color, thickness);
- }
-
- void draw_rectangle_c2(unsigned char* pixels, int w, int h, int rx, int ry, int rw, int rh, unsigned int color, int thickness)
- {
- return draw_rectangle_c2(pixels, w, h, w * 2, rx, ry, rw, rh, color, thickness);
- }
-
- void draw_rectangle_c3(unsigned char* pixels, int w, int h, int rx, int ry, int rw, int rh, unsigned int color, int thickness)
- {
- return draw_rectangle_c3(pixels, w, h, w * 3, rx, ry, rw, rh, color, thickness);
- }
-
- void draw_rectangle_c4(unsigned char* pixels, int w, int h, int rx, int ry, int rw, int rh, unsigned int color, int thickness)
- {
- return draw_rectangle_c4(pixels, w, h, w * 4, rx, ry, rw, rh, color, thickness);
- }
-
// Writes `value` into every pixel of the half-open box [xa, xb) x [ya, yb)
// that also lies inside the w x h image. Rows are `stride` bytes apart.
static void draw_rectangle_c1_fill_box(unsigned char* pixels, int w, int h, int stride, int xa, int xb, int ya, int yb, unsigned char value)
{
    const int col_first = xa < 0 ? 0 : xa;
    const int col_end = xb > w ? w : xb;
    const int row_first = ya < 0 ? 0 : ya;
    const int row_end = yb > h ? h : yb;

    for (int row = row_first; row < row_end; row++)
    {
        unsigned char* line = pixels + stride * row;

        for (int col = col_first; col < col_end; col++)
        {
            line[col] = value;
        }
    }
}

// Draws an axis-aligned rectangle into a 1-channel image.
//   pixels / w / h / stride : destination buffer, its size in pixels and row pitch in bytes
//   rx, ry, rw, rh          : rectangle origin and size in pixels
//   color                   : only the first byte in memory is used
//   thickness               : -1 fills the rectangle; otherwise the border is drawn with
//                             thickness / 2 pixels before each edge coordinate and the
//                             remainder from the edge coordinate onward
// Anything outside the image is clipped.
void draw_rectangle_c1(unsigned char* pixels, int w, int h, int stride, int rx, int ry, int rw, int rh, unsigned int color, int thickness)
{
    const unsigned char gray = ((const unsigned char*)&color)[0];

    if (thickness == -1)
    {
        // solid rectangle
        draw_rectangle_c1_fill_box(pixels, w, h, stride, rx, rx + rw, ry, ry + rh, gray);
        return;
    }

    const int before = thickness / 2;
    const int after = thickness - before;

    const int left = rx;
    const int right = rx + rw;
    const int top = ry;
    const int bottom = ry + rh;

    // top and bottom bands span the full outer width, corners included
    draw_rectangle_c1_fill_box(pixels, w, h, stride, left - before, right + after, top - before, top + after, gray);
    draw_rectangle_c1_fill_box(pixels, w, h, stride, left - before, right + after, bottom - before, bottom + after, gray);

    // left and right bands only cover the rows between the two horizontal bands
    draw_rectangle_c1_fill_box(pixels, w, h, stride, left - before, left + after, top + after, bottom - before, gray);
    draw_rectangle_c1_fill_box(pixels, w, h, stride, right - before, right + after, top + after, bottom - before, gray);
}
-
// Writes the 2-byte pen into every pixel of the half-open box [xa, xb) x [ya, yb)
// that also lies inside the w x h image. Rows are `stride` bytes apart.
static void draw_rectangle_c2_fill_box(unsigned char* pixels, int w, int h, int stride, int xa, int xb, int ya, int yb, const unsigned char* pen)
{
    const int col_first = xa < 0 ? 0 : xa;
    const int col_end = xb > w ? w : xb;
    const int row_first = ya < 0 ? 0 : ya;
    const int row_end = yb > h ? h : yb;

    for (int row = row_first; row < row_end; row++)
    {
        unsigned char* line = pixels + stride * row;

        for (int col = col_first; col < col_end; col++)
        {
            line[col * 2 + 0] = pen[0];
            line[col * 2 + 1] = pen[1];
        }
    }
}

// Draws an axis-aligned rectangle into an interleaved 2-channel image.
//   pixels / w / h / stride : destination buffer, its size in pixels and row pitch in bytes
//   rx, ry, rw, rh          : rectangle origin and size in pixels
//   color                   : the first two bytes in memory are the channel values
//   thickness               : -1 fills the rectangle; otherwise the border is drawn with
//                             thickness / 2 pixels before each edge coordinate and the
//                             remainder from the edge coordinate onward
// Anything outside the image is clipped.
void draw_rectangle_c2(unsigned char* pixels, int w, int h, int stride, int rx, int ry, int rw, int rh, unsigned int color, int thickness)
{
    const unsigned char* pen = (const unsigned char*)&color;

    if (thickness == -1)
    {
        // solid rectangle
        draw_rectangle_c2_fill_box(pixels, w, h, stride, rx, rx + rw, ry, ry + rh, pen);
        return;
    }

    const int before = thickness / 2;
    const int after = thickness - before;

    const int left = rx;
    const int right = rx + rw;
    const int top = ry;
    const int bottom = ry + rh;

    // top and bottom bands span the full outer width, corners included
    draw_rectangle_c2_fill_box(pixels, w, h, stride, left - before, right + after, top - before, top + after, pen);
    draw_rectangle_c2_fill_box(pixels, w, h, stride, left - before, right + after, bottom - before, bottom + after, pen);

    // left and right bands only cover the rows between the two horizontal bands
    draw_rectangle_c2_fill_box(pixels, w, h, stride, left - before, left + after, top + after, bottom - before, pen);
    draw_rectangle_c2_fill_box(pixels, w, h, stride, right - before, right + after, top + after, bottom - before, pen);
}
-
// Writes the 3-byte pen into every pixel of the half-open box [xa, xb) x [ya, yb)
// that also lies inside the w x h image. Rows are `stride` bytes apart.
static void draw_rectangle_c3_fill_box(unsigned char* pixels, int w, int h, int stride, int xa, int xb, int ya, int yb, const unsigned char* pen)
{
    const int col_first = xa < 0 ? 0 : xa;
    const int col_end = xb > w ? w : xb;
    const int row_first = ya < 0 ? 0 : ya;
    const int row_end = yb > h ? h : yb;

    for (int row = row_first; row < row_end; row++)
    {
        unsigned char* line = pixels + stride * row;

        for (int col = col_first; col < col_end; col++)
        {
            line[col * 3 + 0] = pen[0];
            line[col * 3 + 1] = pen[1];
            line[col * 3 + 2] = pen[2];
        }
    }
}

// Draws an axis-aligned rectangle into an interleaved 3-channel image.
//   pixels / w / h / stride : destination buffer, its size in pixels and row pitch in bytes
//   rx, ry, rw, rh          : rectangle origin and size in pixels
//   color                   : the first three bytes in memory are the channel values
//   thickness               : -1 fills the rectangle; otherwise the border is drawn with
//                             thickness / 2 pixels before each edge coordinate and the
//                             remainder from the edge coordinate onward
// Anything outside the image is clipped.
void draw_rectangle_c3(unsigned char* pixels, int w, int h, int stride, int rx, int ry, int rw, int rh, unsigned int color, int thickness)
{
    const unsigned char* pen = (const unsigned char*)&color;

    if (thickness == -1)
    {
        // solid rectangle
        draw_rectangle_c3_fill_box(pixels, w, h, stride, rx, rx + rw, ry, ry + rh, pen);
        return;
    }

    const int before = thickness / 2;
    const int after = thickness - before;

    const int left = rx;
    const int right = rx + rw;
    const int top = ry;
    const int bottom = ry + rh;

    // top and bottom bands span the full outer width, corners included
    draw_rectangle_c3_fill_box(pixels, w, h, stride, left - before, right + after, top - before, top + after, pen);
    draw_rectangle_c3_fill_box(pixels, w, h, stride, left - before, right + after, bottom - before, bottom + after, pen);

    // left and right bands only cover the rows between the two horizontal bands
    draw_rectangle_c3_fill_box(pixels, w, h, stride, left - before, left + after, top + after, bottom - before, pen);
    draw_rectangle_c3_fill_box(pixels, w, h, stride, right - before, right + after, top + after, bottom - before, pen);
}
-
// Writes the 4-byte pen into every pixel of the half-open box [xa, xb) x [ya, yb)
// that also lies inside the w x h image. Rows are `stride` bytes apart.
static void draw_rectangle_c4_fill_box(unsigned char* pixels, int w, int h, int stride, int xa, int xb, int ya, int yb, const unsigned char* pen)
{
    const int col_first = xa < 0 ? 0 : xa;
    const int col_end = xb > w ? w : xb;
    const int row_first = ya < 0 ? 0 : ya;
    const int row_end = yb > h ? h : yb;

    for (int row = row_first; row < row_end; row++)
    {
        unsigned char* line = pixels + stride * row;

        for (int col = col_first; col < col_end; col++)
        {
            line[col * 4 + 0] = pen[0];
            line[col * 4 + 1] = pen[1];
            line[col * 4 + 2] = pen[2];
            line[col * 4 + 3] = pen[3];
        }
    }
}

// Draws an axis-aligned rectangle into an interleaved 4-channel image.
//   pixels / w / h / stride : destination buffer, its size in pixels and row pitch in bytes
//   rx, ry, rw, rh          : rectangle origin and size in pixels
//   color                   : its four bytes, in memory order, are the channel values
//   thickness               : -1 fills the rectangle; otherwise the border is drawn with
//                             thickness / 2 pixels before each edge coordinate and the
//                             remainder from the edge coordinate onward
// Anything outside the image is clipped.
void draw_rectangle_c4(unsigned char* pixels, int w, int h, int stride, int rx, int ry, int rw, int rh, unsigned int color, int thickness)
{
    const unsigned char* pen = (const unsigned char*)&color;

    if (thickness == -1)
    {
        // solid rectangle
        draw_rectangle_c4_fill_box(pixels, w, h, stride, rx, rx + rw, ry, ry + rh, pen);
        return;
    }

    const int before = thickness / 2;
    const int after = thickness - before;

    const int left = rx;
    const int right = rx + rw;
    const int top = ry;
    const int bottom = ry + rh;

    // top and bottom bands span the full outer width, corners included
    draw_rectangle_c4_fill_box(pixels, w, h, stride, left - before, right + after, top - before, top + after, pen);
    draw_rectangle_c4_fill_box(pixels, w, h, stride, left - before, right + after, bottom - before, bottom + after, pen);

    // left and right bands only cover the rows between the two horizontal bands
    draw_rectangle_c4_fill_box(pixels, w, h, stride, left - before, left + after, top + after, bottom - before, pen);
    draw_rectangle_c4_fill_box(pixels, w, h, stride, right - before, right + after, top + after, bottom - before, pen);
}
-
- void draw_rectangle_yuv420sp(unsigned char* yuv420sp, int w, int h, int rx, int ry, int rw, int rh, unsigned int color, int thickness)
- {
- // assert w % 2 == 0
- // assert h % 2 == 0
- // assert rx % 2 == 0
- // assert ry % 2 == 0
- // assert rw % 2 == 0
- // assert rh % 2 == 0
- // assert thickness % 2 == 0
-
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- unsigned int v_y;
- unsigned int v_uv;
- unsigned char* pen_color_y = (unsigned char*)&v_y;
- unsigned char* pen_color_uv = (unsigned char*)&v_uv;
- pen_color_y[0] = pen_color[0];
- pen_color_uv[0] = pen_color[1];
- pen_color_uv[1] = pen_color[2];
-
- unsigned char* Y = yuv420sp;
- draw_rectangle_c1(Y, w, h, rx, ry, rw, rh, v_y, thickness);
-
- unsigned char* UV = yuv420sp + w * h;
- int thickness_uv = thickness == -1 ? thickness : std::max(thickness / 2, 1);
- draw_rectangle_c2(UV, w / 2, h / 2, rx / 2, ry / 2, rw / 2, rh / 2, v_uv, thickness_uv);
- }
-
// True when the point (x0, y0) is no farther than r from (x1, y1).
// Squared lengths are compared, so no square root is needed.
static inline bool distance_lessequal(int x0, int y0, int x1, int y1, float r)
{
    const int across = x0 - x1;
    const int down = y0 - y1;
    const int squared = across * across + down * down;

    return squared <= r * r;
}
-
// True when the distance d between (x0, y0) and (x1, y1) satisfies r0 <= d < r1.
// Squared lengths are compared, so no square root is needed.
static inline bool distance_inrange(int x0, int y0, int x1, int y1, float r0, float r1)
{
    const int across = x0 - x1;
    const int down = y0 - y1;
    const int squared = across * across + down * down;

    if (!(squared >= r0 * r0))
        return false;

    return squared < r1 * r1;
}
-
- void draw_circle_c1(unsigned char* pixels, int w, int h, int cx, int cy, int radius, unsigned int color, int thickness)
- {
- return draw_circle_c1(pixels, w, h, w, cx, cy, radius, color, thickness);
- }
-
- void draw_circle_c2(unsigned char* pixels, int w, int h, int cx, int cy, int radius, unsigned int color, int thickness)
- {
- return draw_circle_c2(pixels, w, h, w * 2, cx, cy, radius, color, thickness);
- }
-
- void draw_circle_c3(unsigned char* pixels, int w, int h, int cx, int cy, int radius, unsigned int color, int thickness)
- {
- return draw_circle_c3(pixels, w, h, w * 3, cx, cy, radius, color, thickness);
- }
-
- void draw_circle_c4(unsigned char* pixels, int w, int h, int cx, int cy, int radius, unsigned int color, int thickness)
- {
- return draw_circle_c4(pixels, w, h, w * 4, cx, cy, radius, color, thickness);
- }
-
- void draw_circle_c1(unsigned char* pixels, int w, int h, int stride, int cx, int cy, int radius, unsigned int color, int thickness)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- if (thickness == -1)
- {
- // filled
- for (int y = cy - (radius - 1); y < cy + radius; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = cx - (radius - 1); x < cx + radius; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from cx cy
- if (distance_lessequal(x, y, cx, cy, radius))
- {
- p[x] = pen_color[0];
- }
- }
- }
-
- return;
- }
-
- const float t0 = thickness / 2.f;
- const float t1 = thickness - t0;
-
- for (int y = cy - (radius - 1) - t0; y < cy + radius + t1; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = cx - (radius - 1) - t0; x < cx + radius + t1; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from cx cy
- if (distance_inrange(x, y, cx, cy, radius - t0, radius + t1))
- {
- p[x] = pen_color[0];
- }
- }
- }
- }
-
- void draw_circle_c2(unsigned char* pixels, int w, int h, int stride, int cx, int cy, int radius, unsigned int color, int thickness)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- if (thickness == -1)
- {
- // filled
- for (int y = cy - (radius - 1); y < cy + radius; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = cx - (radius - 1); x < cx + radius; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from cx cy
- if (distance_lessequal(x, y, cx, cy, radius))
- {
- p[x * 2 + 0] = pen_color[0];
- p[x * 2 + 1] = pen_color[1];
- }
- }
- }
-
- return;
- }
-
- const float t0 = thickness / 2.f;
- const float t1 = thickness - t0;
-
- for (int y = cy - radius - t0; y < cy + radius + t1; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = cx - radius - t0; x < cx + radius + t1; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from cx cy
- if (distance_inrange(x, y, cx, cy, radius - t0, radius + t1))
- {
- p[x * 2 + 0] = pen_color[0];
- p[x * 2 + 1] = pen_color[1];
- }
- }
- }
- }
-
- void draw_circle_c3(unsigned char* pixels, int w, int h, int stride, int cx, int cy, int radius, unsigned int color, int thickness)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- if (thickness == -1)
- {
- // filled
- for (int y = cy - (radius - 1); y < cy + radius; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = cx - (radius - 1); x < cx + radius; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from cx cy
- if (distance_lessequal(x, y, cx, cy, radius))
- {
- p[x * 3 + 0] = pen_color[0];
- p[x * 3 + 1] = pen_color[1];
- p[x * 3 + 2] = pen_color[2];
- }
- }
- }
-
- return;
- }
-
- const float t0 = thickness / 2.f;
- const float t1 = thickness - t0;
-
- for (int y = cy - radius - t0; y < cy + radius + t1; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = cx - radius - t0; x < cx + radius + t1; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from cx cy
- if (distance_inrange(x, y, cx, cy, radius - t0, radius + t1))
- {
- p[x * 3 + 0] = pen_color[0];
- p[x * 3 + 1] = pen_color[1];
- p[x * 3 + 2] = pen_color[2];
- }
- }
- }
- }
-
- void draw_circle_c4(unsigned char* pixels, int w, int h, int stride, int cx, int cy, int radius, unsigned int color, int thickness)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- if (thickness == -1)
- {
- // filled
- for (int y = cy - (radius - 1); y < cy + radius; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = cx - (radius - 1); x < cx + radius; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from cx cy
- if (distance_lessequal(x, y, cx, cy, radius))
- {
- p[x * 4 + 0] = pen_color[0];
- p[x * 4 + 1] = pen_color[1];
- p[x * 4 + 2] = pen_color[2];
- p[x * 4 + 3] = pen_color[3];
- }
- }
- }
-
- return;
- }
-
- const float t0 = thickness / 2.f;
- const float t1 = thickness - t0;
-
- for (int y = cy - (radius - 1) - t0; y < cy + radius + t1; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = cx - (radius - 1) - t0; x < cx + radius + t1; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from cx cy
- if (distance_inrange(x, y, cx, cy, radius - t0, radius + t1))
- {
- p[x * 4 + 0] = pen_color[0];
- p[x * 4 + 1] = pen_color[1];
- p[x * 4 + 2] = pen_color[2];
- p[x * 4 + 3] = pen_color[3];
- }
- }
- }
- }
-
- void draw_circle_yuv420sp(unsigned char* yuv420sp, int w, int h, int cx, int cy, int radius, unsigned int color, int thickness)
- {
- // assert w % 2 == 0
- // assert h % 2 == 0
- // assert cx % 2 == 0
- // assert cy % 2 == 0
- // assert radius % 2 == 0
- // assert thickness % 2 == 0
-
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- unsigned int v_y;
- unsigned int v_uv;
- unsigned char* pen_color_y = (unsigned char*)&v_y;
- unsigned char* pen_color_uv = (unsigned char*)&v_uv;
- pen_color_y[0] = pen_color[0];
- pen_color_uv[0] = pen_color[1];
- pen_color_uv[1] = pen_color[2];
-
- unsigned char* Y = yuv420sp;
- draw_circle_c1(Y, w, h, cx, cy, radius, v_y, thickness);
-
- unsigned char* UV = yuv420sp + w * h;
- int thickness_uv = thickness == -1 ? thickness : std::max(thickness / 2, 1);
- draw_circle_c2(UV, w / 2, h / 2, cx / 2, cy / 2, radius / 2, v_uv, thickness_uv);
- }
-
// True when the point (x, y) projects onto the segment (x0, y0)-(x1, y1) and its
// perpendicular distance to the segment is strictly less than t.
//
// Points whose projection falls before the start or after the end of the segment
// are rejected, so the stroke has flat ends. A zero-length segment is treated as
// the single point (x0, y0). A non-positive t never matches.
static inline bool distance_lessthan(int x, int y, int x0, int y0, int x1, int y1, float t)
{
    // squared distances are never negative, so nothing can be closer than t <= 0
    if (t <= 0.f)
        return false;

    const int dx01 = x1 - x0;
    const int dy01 = y1 - y0;
    const int dx0 = x - x0;
    const int dy0 = y - y0;

    // compare squared lengths, like distance_lessequal / distance_inrange do
    const float t2 = t * t;

    const int len2 = dx01 * dx01 + dy01 * dy01;
    if (len2 == 0)
    {
        // degenerate segment: the projection below would divide zero by zero
        return (float)(dx0 * dx0 + dy0 * dy0) < t2;
    }

    // normalised position of the projection along the segment, 0 at start and 1 at end
    const float r = (float)(dx0 * dx01 + dy0 * dy01) / len2;

    if (r < 0 || r > 1)
        return false;

    // foot of the perpendicular and squared distance from it
    const float px = x0 + dx01 * r;
    const float py = y0 + dy01 * r;
    const float dx = x - px;
    const float dy = y - py;
    const float p = dx * dx + dy * dy;
    return p < t2;
}
-
- void draw_line_c1(unsigned char* pixels, int w, int h, int x0, int y0, int x1, int y1, unsigned int color, int thickness)
- {
- draw_line_c1(pixels, w, h, w, x0, y0, x1, y1, color, thickness);
- }
-
- void draw_line_c2(unsigned char* pixels, int w, int h, int x0, int y0, int x1, int y1, unsigned int color, int thickness)
- {
- draw_line_c2(pixels, w, h, w * 2, x0, y0, x1, y1, color, thickness);
- }
-
- void draw_line_c3(unsigned char* pixels, int w, int h, int x0, int y0, int x1, int y1, unsigned int color, int thickness)
- {
- draw_line_c3(pixels, w, h, w * 3, x0, y0, x1, y1, color, thickness);
- }
-
- void draw_line_c4(unsigned char* pixels, int w, int h, int x0, int y0, int x1, int y1, unsigned int color, int thickness)
- {
- draw_line_c4(pixels, w, h, w * 4, x0, y0, x1, y1, color, thickness);
- }
-
- void draw_line_c1(unsigned char* pixels, int w, int h, int stride, int x0, int y0, int x1, int y1, unsigned int color, int thickness)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- const float t0 = thickness / 2.f;
- const float t1 = thickness - t0;
-
- int x_min = std::min(x0, x1);
- int x_max = std::max(x0, x1);
- int y_min = std::min(y0, y1);
- int y_max = std::max(y0, y1);
-
- for (int y = y_min - t0; y < y_max + t1; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = x_min - t0; x < x_max + t1; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from line
- if (distance_lessthan(x, y, x0, y0, x1, y1, t1))
- {
- p[x] = pen_color[0];
- }
- }
- }
- }
-
- void draw_line_c2(unsigned char* pixels, int w, int h, int stride, int x0, int y0, int x1, int y1, unsigned int color, int thickness)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- const float t0 = thickness / 2.f;
- const float t1 = thickness - t0;
-
- int x_min = std::min(x0, x1);
- int x_max = std::max(x0, x1);
- int y_min = std::min(y0, y1);
- int y_max = std::max(y0, y1);
-
- for (int y = y_min - t0; y < y_max + t1; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = x_min - t0; x < x_max + t1; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from line
- if (distance_lessthan(x, y, x0, y0, x1, y1, t1))
- {
- p[x * 2 + 0] = pen_color[0];
- p[x * 2 + 1] = pen_color[1];
- }
- }
- }
- }
-
- void draw_line_c3(unsigned char* pixels, int w, int h, int stride, int x0, int y0, int x1, int y1, unsigned int color, int thickness)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- const float t0 = thickness / 2.f;
- const float t1 = thickness - t0;
-
- int x_min = std::min(x0, x1);
- int x_max = std::max(x0, x1);
- int y_min = std::min(y0, y1);
- int y_max = std::max(y0, y1);
-
- for (int y = y_min - t0; y < y_max + t1; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = x_min - t0; x < x_max + t1; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from line
- if (distance_lessthan(x, y, x0, y0, x1, y1, t1))
- {
- p[x * 3 + 0] = pen_color[0];
- p[x * 3 + 1] = pen_color[1];
- p[x * 3 + 2] = pen_color[2];
- }
- }
- }
- }
-
- void draw_line_c4(unsigned char* pixels, int w, int h, int stride, int x0, int y0, int x1, int y1, unsigned int color, int thickness)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- const float t0 = thickness / 2.f;
- const float t1 = thickness - t0;
-
- int x_min = std::min(x0, x1);
- int x_max = std::max(x0, x1);
- int y_min = std::min(y0, y1);
- int y_max = std::max(y0, y1);
-
- for (int y = y_min - t0; y < y_max + t1; y++)
- {
- if (y < 0)
- continue;
-
- if (y >= h)
- break;
-
- unsigned char* p = pixels + stride * y;
-
- for (int x = x_min - t0; x < x_max + t1; x++)
- {
- if (x < 0)
- continue;
-
- if (x >= w)
- break;
-
- // distance from line
- if (distance_lessthan(x, y, x0, y0, x1, y1, t1))
- {
- p[x * 4 + 0] = pen_color[0];
- p[x * 4 + 1] = pen_color[1];
- p[x * 4 + 2] = pen_color[2];
- p[x * 4 + 3] = pen_color[3];
- }
- }
- }
- }
-
- void draw_line_yuv420sp(unsigned char* yuv420sp, int w, int h, int x0, int y0, int x1, int y1, unsigned int color, int thickness)
- {
- // assert w % 2 == 0
- // assert h % 2 == 0
- // assert x0 % 2 == 0
- // assert y0 % 2 == 0
- // assert x1 % 2 == 0
- // assert y1 % 2 == 0
- // assert thickness % 2 == 0
-
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- unsigned int v_y;
- unsigned int v_uv;
- unsigned char* pen_color_y = (unsigned char*)&v_y;
- unsigned char* pen_color_uv = (unsigned char*)&v_uv;
- pen_color_y[0] = pen_color[0];
- pen_color_uv[0] = pen_color[1];
- pen_color_uv[1] = pen_color[2];
-
- unsigned char* Y = yuv420sp;
- draw_line_c1(Y, w, h, x0, y0, x1, y1, v_y, thickness);
-
- unsigned char* UV = yuv420sp + w * h;
- int thickness_uv = thickness == -1 ? thickness : std::max(thickness / 2, 1);
- draw_line_c2(UV, w / 2, h / 2, x0 / 2, y0 / 2, x1 / 2, y1 / 2, v_uv, thickness_uv);
- }
-
// Computes the pixel box needed to draw `text` at the given font size.
//   text          : NUL-terminated string; '\n' starts a new line
//   fontpixelsize : each printable character is this wide, each line twice this tall
//   w, h          : receive the width of the widest line and the total height
// Characters for which isprint() is false add no width. An empty string still
// reports the height of one line.
void get_text_drawing_size(const char* text, int fontpixelsize, int* w, int* h)
{
    *w = 0;
    *h = 0;

    int line_w = 0;
    for (const char* p = text; *p != '\0'; p++)
    {
        // isprint() is only defined for values representable as unsigned char (or EOF),
        // so bytes >= 0x80 must not reach it as a negative plain char
        const unsigned char ch = (unsigned char)*p;

        if (ch == '\n')
        {
            // newline: close the current line and start the next one
            *w = std::max(*w, line_w);
            *h += fontpixelsize * 2;
            line_w = 0;
            continue;
        }

        if (isprint(ch) != 0)
        {
            line_w += fontpixelsize;
        }
    }

    // account for the last (or only) line
    *w = std::max(*w, line_w);
    *h += fontpixelsize * 2;
}
-
- void draw_text_c1(unsigned char* pixels, int w, int h, const char* text, int x, int y, int fontpixelsize, unsigned int color)
- {
- return draw_text_c1(pixels, w, h, w, text, x, y, fontpixelsize, color);
- }
-
- void draw_text_c2(unsigned char* pixels, int w, int h, const char* text, int x, int y, int fontpixelsize, unsigned int color)
- {
- return draw_text_c2(pixels, w, h, w * 2, text, x, y, fontpixelsize, color);
- }
-
- void draw_text_c3(unsigned char* pixels, int w, int h, const char* text, int x, int y, int fontpixelsize, unsigned int color)
- {
- return draw_text_c3(pixels, w, h, w * 3, text, x, y, fontpixelsize, color);
- }
-
- void draw_text_c4(unsigned char* pixels, int w, int h, const char* text, int x, int y, int fontpixelsize, unsigned int color)
- {
- return draw_text_c4(pixels, w, h, w * 4, text, x, y, fontpixelsize, color);
- }
-
// Round v to the nearest integer (halves away from zero) and clamp it to the range of short.
static short resize_bilinear_font_saturate_short(float v)
{
    const int rounded = (int)(v + (v >= 0.f ? 0.5f : -0.5f));
    return (short)std::min(std::max(rounded, (int)SHRT_MIN), (int)SHRT_MAX);
}

// Horizontally resample one packed source row into w 16-bit fixed-point samples.
//
// S      one source row: 20 pixels of 4 bits each in 10 bytes, even pixels in the low nibble
// rowp   receives w samples
// xofs   left source pixel index for each destination column (may be -1 or 19 at the borders)
// ialpha two interpolation weights per destination column
static void resize_bilinear_font_hresize_row(const unsigned char* S, short* rowp, const int* xofs, const short* ialpha, int w)
{
    const int srcw = 20;

    for (int dx = 0; dx < w; dx++)
    {
        const int sx = xofs[dx];
        const short a0 = ialpha[dx * 2];
        const short a1 = ialpha[dx * 2 + 1];

        unsigned char p0;
        unsigned char p1;

        if (sx < 0)
        {
            // left neighbour lies outside the glyph and counts as 0
            p0 = 0;
            p1 = S[0] & 0x0f;
        }
        else if (sx >= srcw - 1)
        {
            // right neighbour lies outside the glyph and counts as 0
            p0 = (S[9] & 0xf0) >> 4;
            p1 = 0;
        }
        else
        {
            p0 = sx % 2 == 0 ? S[sx / 2] & 0x0f : (S[sx / 2] & 0xf0) >> 4;
            p1 = sx % 2 == 0 ? (S[sx / 2] & 0xf0) >> 4 : S[sx / 2 + 1] & 0x0f;
        }

        // * 17 stretches the 4-bit range 0..15 to 0..255; >> 4 keeps the result within short
        rowp[dx] = (p0 * a0 + p1 * a1) * 17 >> 4;
    }
}

// Bilinearly resize one 20x40 glyph, stored as packed 4-bit coverage values,
// into an 8-bit coverage map of fontpixelsize x (fontpixelsize * 2) pixels.
//
// font_bitmap          source glyph, 40 rows of 10 bytes (two pixels per byte)
// resized_font_bitmap  destination, fontpixelsize * fontpixelsize * 2 bytes, row-major
// fontpixelsize        destination glyph width in pixels; the height is twice this value
//
// Source pixels outside the glyph are treated as 0.
// Nothing is written when fontpixelsize <= 0.
void resize_bilinear_font(const unsigned char* font_bitmap, unsigned char* resized_font_bitmap, int fontpixelsize)
{
    if (fontpixelsize <= 0)
    {
        // empty output; also keeps a negative element count away from operator new[]
        return;
    }

    const int INTER_RESIZE_COEF_BITS = 11;
    const int INTER_RESIZE_COEF_SCALE = 1 << INTER_RESIZE_COEF_BITS;

    const int srcw = 20;
    const int srch = 40;
    const int w = fontpixelsize;
    const int h = fontpixelsize * 2;

    // the same factor is used for both axes since srch / h == srcw / w
    const double scale = (double)srcw / w;

    // single scratch allocation, laid out as
    //   xofs[w ints] | yofs[h ints] | ialpha[2w shorts] | ibeta[2h shorts] | rows0[w shorts] | rows1[w shorts]
    int* buf = new int[w + h + w + h + w];

    int* xofs = buf;
    int* yofs = buf + w;

    short* ialpha = (short*)(buf + w + h);
    short* ibeta = (short*)(buf + w + h + w);

    short* rows0 = (short*)(buf + w + h + w + h);
    short* rows1 = rows0 + w;

    // horizontal source offsets and weights
    for (int dx = 0; dx < w; dx++)
    {
        float fx = (float)((dx + 0.5) * scale - 0.5);
        const int sx = static_cast<int>(floor(fx));
        fx -= sx;

        xofs[dx] = sx;

        const float a0 = (1.f - fx) * INTER_RESIZE_COEF_SCALE;
        const float a1 = fx * INTER_RESIZE_COEF_SCALE;

        ialpha[dx * 2] = resize_bilinear_font_saturate_short(a0);
        ialpha[dx * 2 + 1] = resize_bilinear_font_saturate_short(a1);
    }

    // vertical source offsets and weights
    for (int dy = 0; dy < h; dy++)
    {
        float fy = (float)((dy + 0.5) * scale - 0.5);
        const int sy = static_cast<int>(floor(fy));
        fy -= sy;

        yofs[dy] = sy;

        const float b0 = (1.f - fy) * INTER_RESIZE_COEF_SCALE;
        const float b1 = fy * INTER_RESIZE_COEF_SCALE;

        ibeta[dy * 2] = resize_bilinear_font_saturate_short(b0);
        ibeta[dy * 2 + 1] = resize_bilinear_font_saturate_short(b1);
    }

    // rows1 starts as an all-zero row: when the first sy is -1 it is swapped into
    // rows0 and stands for the empty row above the glyph
    for (int dx = 0; dx < w; dx++)
    {
        rows1[dx] = 0;
    }

    // -2 so that a first sy of -1 takes the "one new row" path below
    int prev_sy1 = -2;

    for (int dy = 0; dy < h; dy++)
    {
        const int sy = yofs[dy];

        if (sy == prev_sy1)
        {
            // reuse all rows
        }
        else if (sy == prev_sy1 + 1)
        {
            // hresize one row: the previous lower row becomes the upper row
            short* rows0_old = rows0;
            rows0 = rows1;
            rows1 = rows0_old;

            if (sy >= srch - 1)
            {
                // the lower row lies below the glyph
                for (int dx = 0; dx < w; dx++)
                {
                    rows1[dx] = 0;
                }
            }
            else
            {
                resize_bilinear_font_hresize_row(font_bitmap + 10 * (sy + 1), rows1, xofs, ialpha, w);
            }
        }
        else
        {
            // hresize two rows
            resize_bilinear_font_hresize_row(font_bitmap + 10 * sy, rows0, xofs, ialpha, w);

            if (sy >= srch - 1)
            {
                // the lower row lies below the glyph
                for (int dx = 0; dx < w; dx++)
                {
                    rows1[dx] = 0;
                }
            }
            else
            {
                resize_bilinear_font_hresize_row(font_bitmap + 10 * (sy + 1), rows1, xofs, ialpha, w);
            }
        }

        prev_sy1 = sy;

        if (dy + 1 < h && yofs[dy + 1] == sy)
        {
            // vresize for two rows: the next output row blends the same source rows,
            // so both are produced in one pass
            short b0 = ibeta[0];
            short b1 = ibeta[1];
            short b2 = ibeta[2];
            short b3 = ibeta[3];

            short* rows0p = rows0;
            short* rows1p = rows1;
            unsigned char* Dp0 = resized_font_bitmap + w * (dy);
            unsigned char* Dp1 = resized_font_bitmap + w * (dy + 1);

            int dx = 0;
#if __ARM_NEON
            int16x8_t _b0 = vdupq_n_s16(b0);
            int16x8_t _b1 = vdupq_n_s16(b1);
            int16x8_t _b2 = vdupq_n_s16(b2);
            int16x8_t _b3 = vdupq_n_s16(b3);
            for (; dx + 15 < w; dx += 16)
            {
                int16x8_t _r00 = vld1q_s16(rows0p);
                int16x8_t _r01 = vld1q_s16(rows0p + 8);
                int16x8_t _r10 = vld1q_s16(rows1p);
                int16x8_t _r11 = vld1q_s16(rows1p + 8);
                int16x8_t _acc00 = vaddq_s16(vqdmulhq_s16(_r00, _b0), vqdmulhq_s16(_r10, _b1));
                int16x8_t _acc01 = vaddq_s16(vqdmulhq_s16(_r01, _b0), vqdmulhq_s16(_r11, _b1));
                int16x8_t _acc10 = vaddq_s16(vqdmulhq_s16(_r00, _b2), vqdmulhq_s16(_r10, _b3));
                int16x8_t _acc11 = vaddq_s16(vqdmulhq_s16(_r01, _b2), vqdmulhq_s16(_r11, _b3));
                uint8x16_t _Dp0 = vcombine_u8(vqrshrun_n_s16(_acc00, 3), vqrshrun_n_s16(_acc01, 3));
                uint8x16_t _Dp1 = vcombine_u8(vqrshrun_n_s16(_acc10, 3), vqrshrun_n_s16(_acc11, 3));
                vst1q_u8(Dp0, _Dp0);
                vst1q_u8(Dp1, _Dp1);
                Dp0 += 16;
                Dp1 += 16;
                rows0p += 16;
                rows1p += 16;
            }
            for (; dx + 7 < w; dx += 8)
            {
                int16x8_t _r0 = vld1q_s16(rows0p);
                int16x8_t _r1 = vld1q_s16(rows1p);
                int16x8_t _acc0 = vaddq_s16(vqdmulhq_s16(_r0, _b0), vqdmulhq_s16(_r1, _b1));
                int16x8_t _acc1 = vaddq_s16(vqdmulhq_s16(_r0, _b2), vqdmulhq_s16(_r1, _b3));
                uint8x8_t _Dp0 = vqrshrun_n_s16(_acc0, 3);
                uint8x8_t _Dp1 = vqrshrun_n_s16(_acc1, 3);
                vst1_u8(Dp0, _Dp0);
                vst1_u8(Dp1, _Dp1);
                Dp0 += 8;
                Dp1 += 8;
                rows0p += 8;
                rows1p += 8;
            }
#endif // __ARM_NEON
#if __SSE2__
            __m128i _b0 = _mm_set1_epi16(b0);
            __m128i _b1 = _mm_set1_epi16(b1);
            __m128i _b2 = _mm_set1_epi16(b2);
            __m128i _b3 = _mm_set1_epi16(b3);
            __m128i _v2 = _mm_set1_epi16(2);
            for (; dx + 15 < w; dx += 16)
            {
                __m128i _r00 = _mm_loadu_si128((const __m128i*)rows0p);
                __m128i _r01 = _mm_loadu_si128((const __m128i*)(rows0p + 8));
                __m128i _r10 = _mm_loadu_si128((const __m128i*)rows1p);
                __m128i _r11 = _mm_loadu_si128((const __m128i*)(rows1p + 8));
                __m128i _acc00 = _mm_add_epi16(_mm_mulhi_epi16(_r00, _b0), _mm_mulhi_epi16(_r10, _b1));
                __m128i _acc01 = _mm_add_epi16(_mm_mulhi_epi16(_r01, _b0), _mm_mulhi_epi16(_r11, _b1));
                __m128i _acc10 = _mm_add_epi16(_mm_mulhi_epi16(_r00, _b2), _mm_mulhi_epi16(_r10, _b3));
                __m128i _acc11 = _mm_add_epi16(_mm_mulhi_epi16(_r01, _b2), _mm_mulhi_epi16(_r11, _b3));
                _acc00 = _mm_srai_epi16(_mm_add_epi16(_acc00, _v2), 2);
                _acc01 = _mm_srai_epi16(_mm_add_epi16(_acc01, _v2), 2);
                _acc10 = _mm_srai_epi16(_mm_add_epi16(_acc10, _v2), 2);
                _acc11 = _mm_srai_epi16(_mm_add_epi16(_acc11, _v2), 2);
                __m128i _Dp0 = _mm_packus_epi16(_acc00, _acc01);
                __m128i _Dp1 = _mm_packus_epi16(_acc10, _acc11);
                _mm_storeu_si128((__m128i*)Dp0, _Dp0);
                _mm_storeu_si128((__m128i*)Dp1, _Dp1);
                Dp0 += 16;
                Dp1 += 16;
                rows0p += 16;
                rows1p += 16;
            }
            for (; dx + 7 < w; dx += 8)
            {
                __m128i _r0 = _mm_loadu_si128((const __m128i*)rows0p);
                __m128i _r1 = _mm_loadu_si128((const __m128i*)rows1p);
                __m128i _acc0 = _mm_add_epi16(_mm_mulhi_epi16(_r0, _b0), _mm_mulhi_epi16(_r1, _b1));
                __m128i _acc1 = _mm_add_epi16(_mm_mulhi_epi16(_r0, _b2), _mm_mulhi_epi16(_r1, _b3));
                _acc0 = _mm_srai_epi16(_mm_add_epi16(_acc0, _v2), 2);
                _acc1 = _mm_srai_epi16(_mm_add_epi16(_acc1, _v2), 2);
                __m128i _Dp0 = _mm_packus_epi16(_acc0, _acc0);
                __m128i _Dp1 = _mm_packus_epi16(_acc1, _acc1);
                _mm_storel_epi64((__m128i*)Dp0, _Dp0);
                _mm_storel_epi64((__m128i*)Dp1, _Dp1);
                Dp0 += 8;
                Dp1 += 8;
                rows0p += 8;
                rows1p += 8;
            }
#endif // __SSE2__
            // scalar tail (and the whole row when no SIMD path is compiled in)
            for (; dx < w; dx++)
            {
                short s0 = *rows0p++;
                short s1 = *rows1p++;

                *Dp0++ = (unsigned char)(((short)((b0 * s0) >> 16) + (short)((b1 * s1) >> 16) + 2) >> 2);
                *Dp1++ = (unsigned char)(((short)((b2 * s0) >> 16) + (short)((b3 * s1) >> 16) + 2) >> 2);
            }

            // two output rows were written
            ibeta += 4;
            dy += 1;
        }
        else
        {
            // vresize
            short b0 = ibeta[0];
            short b1 = ibeta[1];

            short* rows0p = rows0;
            short* rows1p = rows1;
            unsigned char* Dp = resized_font_bitmap + w * (dy);

            int dx = 0;
#if __ARM_NEON
            int16x8_t _b0 = vdupq_n_s16(b0);
            int16x8_t _b1 = vdupq_n_s16(b1);
            for (; dx + 15 < w; dx += 16)
            {
                int16x8_t _r00 = vld1q_s16(rows0p);
                int16x8_t _r01 = vld1q_s16(rows0p + 8);
                int16x8_t _r10 = vld1q_s16(rows1p);
                int16x8_t _r11 = vld1q_s16(rows1p + 8);
                int16x8_t _acc0 = vaddq_s16(vqdmulhq_s16(_r00, _b0), vqdmulhq_s16(_r10, _b1));
                int16x8_t _acc1 = vaddq_s16(vqdmulhq_s16(_r01, _b0), vqdmulhq_s16(_r11, _b1));
                uint8x16_t _Dp = vcombine_u8(vqrshrun_n_s16(_acc0, 3), vqrshrun_n_s16(_acc1, 3));
                vst1q_u8(Dp, _Dp);
                Dp += 16;
                rows0p += 16;
                rows1p += 16;
            }
            for (; dx + 7 < w; dx += 8)
            {
                int16x8_t _r0 = vld1q_s16(rows0p);
                int16x8_t _r1 = vld1q_s16(rows1p);
                int16x8_t _acc = vaddq_s16(vqdmulhq_s16(_r0, _b0), vqdmulhq_s16(_r1, _b1));
                uint8x8_t _Dp = vqrshrun_n_s16(_acc, 3);
                vst1_u8(Dp, _Dp);
                Dp += 8;
                rows0p += 8;
                rows1p += 8;
            }
#endif // __ARM_NEON
#if __SSE2__
            __m128i _b0 = _mm_set1_epi16(b0);
            __m128i _b1 = _mm_set1_epi16(b1);
            __m128i _v2 = _mm_set1_epi16(2);
            for (; dx + 15 < w; dx += 16)
            {
                __m128i _r00 = _mm_loadu_si128((const __m128i*)rows0p);
                __m128i _r01 = _mm_loadu_si128((const __m128i*)(rows0p + 8));
                __m128i _r10 = _mm_loadu_si128((const __m128i*)rows1p);
                __m128i _r11 = _mm_loadu_si128((const __m128i*)(rows1p + 8));
                __m128i _acc0 = _mm_add_epi16(_mm_mulhi_epi16(_r00, _b0), _mm_mulhi_epi16(_r10, _b1));
                __m128i _acc1 = _mm_add_epi16(_mm_mulhi_epi16(_r01, _b0), _mm_mulhi_epi16(_r11, _b1));
                _acc0 = _mm_srai_epi16(_mm_add_epi16(_acc0, _v2), 2);
                _acc1 = _mm_srai_epi16(_mm_add_epi16(_acc1, _v2), 2);
                __m128i _Dp = _mm_packus_epi16(_acc0, _acc1);
                _mm_storeu_si128((__m128i*)Dp, _Dp);
                Dp += 16;
                rows0p += 16;
                rows1p += 16;
            }
            for (; dx + 7 < w; dx += 8)
            {
                __m128i _r0 = _mm_loadu_si128((const __m128i*)rows0p);
                __m128i _r1 = _mm_loadu_si128((const __m128i*)rows1p);
                __m128i _acc = _mm_add_epi16(_mm_mulhi_epi16(_r0, _b0), _mm_mulhi_epi16(_r1, _b1));
                _acc = _mm_srai_epi16(_mm_add_epi16(_acc, _v2), 2);
                __m128i _Dp = _mm_packus_epi16(_acc, _acc);
                _mm_storel_epi64((__m128i*)Dp, _Dp);
                Dp += 8;
                rows0p += 8;
                rows1p += 8;
            }
#endif // __SSE2__
            // scalar tail (and the whole row when no SIMD path is compiled in)
            for (; dx < w; dx++)
            {
                short s0 = *rows0p++;
                short s1 = *rows1p++;

                *Dp++ = (unsigned char)(((short)((b0 * s0) >> 16) + (short)((b1 * s1) >> 16) + 2) >> 2);
            }

            ibeta += 2;
        }
    }

    delete[] buf;
}
-
- void draw_text_c1(unsigned char* pixels, int w, int h, int stride, const char* text, int x, int y, int fontpixelsize, unsigned int color)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- unsigned char* resized_font_bitmap = new unsigned char[fontpixelsize * fontpixelsize * 2];
-
- const int n = strlen(text);
-
- int cursor_x = x;
- int cursor_y = y;
- for (int i = 0; i < n; i++)
- {
- char ch = text[i];
-
- if (ch == '\n')
- {
- // newline
- cursor_x = x;
- cursor_y += fontpixelsize * 2;
- continue;
- }
-
- if (ch == ' ')
- {
- cursor_x += fontpixelsize;
- continue;
- }
-
- if (isprint(ch) != 0)
- {
- const unsigned char* font_bitmap = mono_font_data[ch - '!'];
-
- // draw resized character
- resize_bilinear_font(font_bitmap, resized_font_bitmap, fontpixelsize);
-
- const int ystart = std::max(cursor_y, 0);
- const int yend = std::min(cursor_y + fontpixelsize * 2, h);
- const int xstart = std::max(cursor_x, 0);
- const int xend = std::min(cursor_x + fontpixelsize, w);
-
- for (int j = ystart; j < yend; j++)
- {
- const unsigned char* palpha = resized_font_bitmap + (j - cursor_y) * fontpixelsize + xstart - cursor_x;
- unsigned char* p = pixels + stride * j + xstart;
-
- for (int k = xstart; k < xend; k++)
- {
- unsigned char alpha = *palpha++;
-
- p[0] = (p[0] * (255 - alpha) + pen_color[0] * alpha) / 255;
- p += 1;
- }
- }
-
- cursor_x += fontpixelsize;
- }
- }
-
- delete[] resized_font_bitmap;
- }
-
- void draw_text_c2(unsigned char* pixels, int w, int h, int stride, const char* text, int x, int y, int fontpixelsize, unsigned int color)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- unsigned char* resized_font_bitmap = new unsigned char[fontpixelsize * fontpixelsize * 2];
-
- const int n = strlen(text);
-
- int cursor_x = x;
- int cursor_y = y;
- for (int i = 0; i < n; i++)
- {
- char ch = text[i];
-
- if (ch == '\n')
- {
- // newline
- cursor_x = x;
- cursor_y += fontpixelsize * 2;
- continue;
- }
-
- if (ch == ' ')
- {
- cursor_x += fontpixelsize;
- continue;
- }
-
- if (isprint(ch) != 0)
- {
- const unsigned char* font_bitmap = mono_font_data[ch - '!'];
-
- // draw resized character
- resize_bilinear_font(font_bitmap, resized_font_bitmap, fontpixelsize);
-
- const int ystart = std::max(cursor_y, 0);
- const int yend = std::min(cursor_y + fontpixelsize * 2, h);
- const int xstart = std::max(cursor_x, 0);
- const int xend = std::min(cursor_x + fontpixelsize, w);
-
- for (int j = ystart; j < yend; j++)
- {
- const unsigned char* palpha = resized_font_bitmap + (j - cursor_y) * fontpixelsize + xstart - cursor_x;
- unsigned char* p = pixels + stride * j + xstart * 2;
-
- for (int k = xstart; k < xend; k++)
- {
- unsigned char alpha = *palpha++;
-
- p[0] = (p[0] * (255 - alpha) + pen_color[0] * alpha) / 255;
- p[1] = (p[1] * (255 - alpha) + pen_color[1] * alpha) / 255;
- p += 2;
- }
- }
-
- cursor_x += fontpixelsize;
- }
- }
-
- delete[] resized_font_bitmap;
- }
-
- void draw_text_c3(unsigned char* pixels, int w, int h, int stride, const char* text, int x, int y, int fontpixelsize, unsigned int color)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- unsigned char* resized_font_bitmap = new unsigned char[fontpixelsize * fontpixelsize * 2];
-
- const int n = strlen(text);
-
- int cursor_x = x;
- int cursor_y = y;
- for (int i = 0; i < n; i++)
- {
- char ch = text[i];
-
- if (ch == '\n')
- {
- // newline
- cursor_x = x;
- cursor_y += fontpixelsize * 2;
- continue;
- }
-
- if (ch == ' ')
- {
- cursor_x += fontpixelsize;
- continue;
- }
-
- if (isprint(ch) != 0)
- {
- const unsigned char* font_bitmap = mono_font_data[ch - '!'];
-
- // draw resized character
- resize_bilinear_font(font_bitmap, resized_font_bitmap, fontpixelsize);
-
- const int ystart = std::max(cursor_y, 0);
- const int yend = std::min(cursor_y + fontpixelsize * 2, h);
- const int xstart = std::max(cursor_x, 0);
- const int xend = std::min(cursor_x + fontpixelsize, w);
-
- for (int j = ystart; j < yend; j++)
- {
- const unsigned char* palpha = resized_font_bitmap + (j - cursor_y) * fontpixelsize + xstart - cursor_x;
- unsigned char* p = pixels + stride * j + xstart * 3;
-
- for (int k = xstart; k < xend; k++)
- {
- unsigned char alpha = *palpha++;
-
- p[0] = (p[0] * (255 - alpha) + pen_color[0] * alpha) / 255;
- p[1] = (p[1] * (255 - alpha) + pen_color[1] * alpha) / 255;
- p[2] = (p[2] * (255 - alpha) + pen_color[2] * alpha) / 255;
- p += 3;
- }
- }
-
- cursor_x += fontpixelsize;
- }
- }
-
- delete[] resized_font_bitmap;
- }
-
- void draw_text_c4(unsigned char* pixels, int w, int h, int stride, const char* text, int x, int y, int fontpixelsize, unsigned int color)
- {
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- unsigned char* resized_font_bitmap = new unsigned char[fontpixelsize * fontpixelsize * 2];
-
- const int n = strlen(text);
-
- int cursor_x = x;
- int cursor_y = y;
- for (int i = 0; i < n; i++)
- {
- char ch = text[i];
-
- if (ch == '\n')
- {
- // newline
- cursor_x = x;
- cursor_y += fontpixelsize * 2;
- continue;
- }
-
- if (ch == ' ')
- {
- cursor_x += fontpixelsize;
- continue;
- }
-
- if (isprint(ch) != 0)
- {
- const unsigned char* font_bitmap = mono_font_data[ch - '!'];
-
- // draw resized character
- resize_bilinear_font(font_bitmap, resized_font_bitmap, fontpixelsize);
-
- const int ystart = std::max(cursor_y, 0);
- const int yend = std::min(cursor_y + fontpixelsize * 2, h);
- const int xstart = std::max(cursor_x, 0);
- const int xend = std::min(cursor_x + fontpixelsize, w);
-
- for (int j = ystart; j < yend; j++)
- {
- const unsigned char* palpha = resized_font_bitmap + (j - cursor_y) * fontpixelsize + xstart - cursor_x;
- unsigned char* p = pixels + stride * j + xstart * 4;
-
- for (int k = xstart; k < xend; k++)
- {
- unsigned char alpha = *palpha++;
-
- p[0] = (p[0] * (255 - alpha) + pen_color[0] * alpha) / 255;
- p[1] = (p[1] * (255 - alpha) + pen_color[1] * alpha) / 255;
- p[2] = (p[2] * (255 - alpha) + pen_color[2] * alpha) / 255;
- p[3] = (p[3] * (255 - alpha) + pen_color[3] * alpha) / 255;
- p += 4;
- }
- }
-
- cursor_x += fontpixelsize;
- }
- }
-
- delete[] resized_font_bitmap;
- }
-
- void draw_text_yuv420sp(unsigned char* yuv420sp, int w, int h, const char* text, int x, int y, int fontpixelsize, unsigned int color)
- {
- // assert w % 2 == 0
- // assert h % 2 == 0
- // assert x % 2 == 0
- // assert y % 2 == 0
- // assert fontpixelsize % 2 == 0
-
- const unsigned char* pen_color = (const unsigned char*)&color;
-
- unsigned int v_y;
- unsigned int v_uv;
- unsigned char* pen_color_y = (unsigned char*)&v_y;
- unsigned char* pen_color_uv = (unsigned char*)&v_uv;
- pen_color_y[0] = pen_color[0];
- pen_color_uv[0] = pen_color[1];
- pen_color_uv[1] = pen_color[2];
-
- unsigned char* Y = yuv420sp;
- draw_text_c1(Y, w, h, text, x, y, fontpixelsize, v_y);
-
- unsigned char* UV = yuv420sp + w * h;
- draw_text_c2(UV, w / 2, h / 2, text, x / 2, y / 2, std::max(fontpixelsize / 2, 1), v_uv);
- }
-
- #endif // NCNN_PIXEL_DRAWING
-
- } // namespace ncnn
|