12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590 |
- /*
- * Copyright 2024 Vsevolod Stakhov
- *
- * Licensed under the Apache License, Version 2.0 (the "License");
- * you may not use this file except in compliance with the License.
- * You may obtain a copy of the License at
- *
- * http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
- #include "lua_common.h"
- #include "unix-std.h"
- #include "lua_compress.h"
- #include "libmime/email_addr.h"
- #include "libmime/content_type.h"
- #include "libmime/mime_headers.h"
- #include "libutil/hash.h"
-
- #include "lua_parsers.h"
-
- #ifdef WITH_LUA_REPL
- #include "replxx.h"
- #endif
-
- #include <math.h>
- #include <glob.h>
-
- #include "unicode/uspoof.h"
- #include "unicode/uscript.h"
- #include "contrib/fastutf8/fastutf8.h"
-
- /***
- * @module rspamd_util
- * This module contains some generic purpose utilities that could be useful for
- * testing and production rules.
- */
-
- /***
- * @function util.create_event_base()
- * Creates new event base for processing asynchronous events
- * @return {ev_base} new event processing base
- */
- LUA_FUNCTION_DEF(util, create_event_base);
- /***
- * @function util.load_rspamd_config(filename)
- * Load rspamd config from the specified file
- * @return {config} new configuration object suitable for access
- */
- LUA_FUNCTION_DEF(util, load_rspamd_config);
- /***
- * @function util.config_from_ucl(any, string)
- * Load rspamd config from ucl represented by any lua table
- * @return {config} new configuration object suitable for access
- */
- LUA_FUNCTION_DEF(util, config_from_ucl);
- /***
- * @function util.encode_base64(input[, str_len, [newlines_type]])
- * Encodes data in base64 breaking lines if needed
- * @param {text or string} input input data
- * @param {number} str_len optional size of lines or 0 if split is not needed
- * @return {rspamd_text} encoded data chunk
- */
- LUA_FUNCTION_DEF(util, encode_base64);
- /***
- * @function util.encode_qp(input[, str_len, [newlines_type]])
- * Encodes data in quoted printable breaking lines if needed
- * @param {text or string} input input data
- * @param {number} str_len optional size of lines or 0 if split is not needed
- * @return {rspamd_text} encoded data chunk
- */
- LUA_FUNCTION_DEF(util, encode_qp);
-
- /***
- * @function util.decode_qp(input)
- * Decodes data from quoted printable
- * @param {text or string} input input data
- * @return {rspamd_text} decoded data chunk
- */
- LUA_FUNCTION_DEF(util, decode_qp);
-
- /***
- * @function util.decode_base64(input)
- * Decodes data from base64 ignoring whitespace characters
- * @param {text or string} input data to decode; if `rspamd{text}` is used then the string is modified **in-place**
- * @return {rspamd_text} decoded data chunk
- */
- LUA_FUNCTION_DEF(util, decode_base64);
-
- /***
- * @function util.encode_base32(input, [b32type = 'default'])
- * Encodes data in base32 breaking lines if needed
- * @param {text or string} input input data
- * @param {string} b32type base32 type (default, bleach, rfc)
- * @return {rspamd_text} encoded data chunk
- */
- LUA_FUNCTION_DEF(util, encode_base32);
- /***
- * @function util.decode_base32(input, [b32type = 'default'])
- * Decodes data from base32 ignoring whitespace characters
- * @param {text or string} input data to decode
- * @param {string} b32type base32 type (default, bleach, rfc)
- * @return {rspamd_text} decoded data chunk
- */
- LUA_FUNCTION_DEF(util, decode_base32);
-
- /***
- * @function util.decode_url(input)
- * Decodes data from url encoding
- * @param {text or string} input data to decode
- * @return {rspamd_text} decoded data chunk
- */
- LUA_FUNCTION_DEF(util, decode_url);
-
- /***
- * @function util.tokenize_text(input[, exceptions])
- * Create tokens from a text using optional exceptions list
- * @param {text/string} input input data
- * @param {table} exceptions, a table of pairs containing <start_pos,length> of exceptions in the input
- * @return {table/strings} list of strings representing words in the text
- */
- LUA_FUNCTION_DEF(util, tokenize_text);
- LUA_FUNCTION_DEF(util, process_message); /* NOTE(review): unlike the neighbouring declarations this one has no doc block; its arguments and return values are not visible here - TODO document */
- /***
- * @function util.tanh(num)
- * Calculates hyperbolic tangent of the specified floating point value
- * @param {number} num input number
- * @return {number} hyperbolic tangent of the variable
- */
- LUA_FUNCTION_DEF(util, tanh);
-
- /***
- * @function util.parse_html(input)
- * Parses HTML and returns the according text
- * @param {string|text} input input HTML
- * @return {rspamd_text} processed text with no HTML tags
- */
- LUA_FUNCTION_DEF(util, parse_html);
-
- /***
- * @function util.levenshtein_distance(s1, s2)
- * Returns Levenshtein distance between two strings
- * @param {string} s1 the first string
- * @param {string} s2 the second string
- * @return {number} number of differences in two strings
- */
- LUA_FUNCTION_DEF(util, levenshtein_distance);
-
- /***
- * @function util.fold_header(name, value, [how, [stop_chars]])
- * Fold rfc822 header according to the folding rules
- *
- * @param {string} name name of the header
- * @param {string} value value of the header
- * @param {string} how "cr" for \r, "lf" for \n and "crlf" for \r\n (default)
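- * @param {string} stop_chars optional extra characters at which the header may also be folded (original description was truncated; TODO confirm against the implementation)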
- * @return {string} Folded value of the header
- */
- LUA_FUNCTION_DEF(util, fold_header);
-
- /***
- * @function util.is_uppercase(str)
- * Returns true if a string is all uppercase
- *
- * @param {string} str input string
- * @return {bool} true if a string is all uppercase
- */
- LUA_FUNCTION_DEF(util, is_uppercase);
-
- /***
- * @function util.humanize_number(num)
- * Returns humanized representation of given number (like 1k instead of 1000)
- *
- * @param {number} num number to humanize
- * @return {string} humanized representation of a number
- */
- LUA_FUNCTION_DEF(util, humanize_number);
-
- /***
- * @function util.get_tld(host)
- * Returns effective second level domain part (eSLD) for the specified host
- *
- * @param {string} host hostname
- * @return {string} eSLD part of the hostname or the full hostname if eSLD was not found
- */
- LUA_FUNCTION_DEF(util, get_tld);
-
- /***
- * @function util.glob(pattern)
- * Returns results for the glob match for the specified pattern
- *
- * @param {string} pattern glob pattern to match ('?' and '*' are supported)
- * @return {table/string} list of matched files
- */
- LUA_FUNCTION_DEF(util, glob);
-
- /***
- * @function util.parse_mail_address(str, [pool])
- * Parses email address and returns a table of tables in the following format:
- *
- * - `raw` - the original value without any processing
- * - `name` - name of internet address in UTF8, e.g. for `Vsevolod Stakhov <blah@foo.com>` it returns `Vsevolod Stakhov`
- * - `addr` - address part of the address
- * - `user` - user part (if present) of the address, e.g. `blah`
- * - `domain` - domain part (if present), e.g. `foo.com`
- * - `flags` - table with following keys set to true if given condition fulfilled:
- * - [valid] - valid SMTP address in conformity with https://tools.ietf.org/html/rfc5321#section-4.1.
- * - [ip] - domain is IPv4/IPv6 address
- * - [braced] - angled `<blah@foo.com>` address
- * - [quoted] - quoted user part
- * - [empty] - empty address
- * - [backslash] - user part contains backslash
- * - [8bit] - contains 8bit characters
- *
- * @param {string} str input string
- * @param {rspamd_mempool} pool memory pool to use
- * @return {table/tables} parsed list of mail addresses
- */
- LUA_FUNCTION_DEF(util, parse_mail_address);
-
- /***
- * @function util.strlen_utf8(str)
- * Returns length of string encoded in utf-8 in characters.
- * If invalid characters are found, then this function returns number of bytes.
- * @param {string} str utf8 encoded string
- * @return {number} number of characters in string
- */
- LUA_FUNCTION_DEF(util, strlen_utf8);
-
- /***
- * @function util.lower_utf8(str)
- * Converts utf8 string to lower case
- * @param {string} str utf8 encoded string
- * @return {string} lowercased utf8 string
- */
- LUA_FUNCTION_DEF(util, lower_utf8);
-
- /***
- * @function util.normalize_utf8(str)
- * Gets a string in UTF8 and normalises it to NFKC_Casefold form
- * @param {string} str utf8 encoded string
- * @return {string,integer} lowercased utf8 string + result of the normalisation (use bit.band to check):
- * RSPAMD_UNICODE_NORM_NORMAL = 0,
- * RSPAMD_UNICODE_NORM_UNNORMAL = (1 << 0),
- * RSPAMD_UNICODE_NORM_ZERO_SPACES = (1 << 1),
- * RSPAMD_UNICODE_NORM_ERROR = (1 << 2),
- * RSPAMD_UNICODE_NORM_OVERFLOW = (1 << 3)
- */
- LUA_FUNCTION_DEF(util, normalize_utf8);
-
-
- /***
- * @function util.transliterate(str)
- * Converts utf8 encoded string to latin transliteration
- * @param {string/text} str utf8 encoded string
- * @return {text} transliterated string
- */
- LUA_FUNCTION_DEF(util, transliterate);
-
- /***
- * @function util.strequal_caseless(str1, str2)
- * Compares two strings regardless of their case using ascii comparison.
- * Returns `true` if `str1` is equal to `str2`
- * @param {string} str1 utf8 encoded string
- * @param {string} str2 utf8 encoded string
- * @return {bool} result of comparison
- */
- LUA_FUNCTION_DEF(util, strequal_caseless);
-
-
- /***
- * @function util.strequal_caseless_utf8(str1, str2)
- * Compares two utf8 strings regardless of their case using utf8 collation rules.
- * Returns `true` if `str1` is equal to `str2`
- * @param {string} str1 utf8 encoded string
- * @param {string} str2 utf8 encoded string
- * @return {bool} result of comparison
- */
- LUA_FUNCTION_DEF(util, strequal_caseless_utf8);
-
-
- /***
- * @function util.get_ticks()
- * Returns current number of ticks as floating point number
- * @return {number} number of current clock ticks (monotonically increasing)
- */
- LUA_FUNCTION_DEF(util, get_ticks);
-
- /***
- * @function util.get_time()
- * Returns current time as unix time in floating point representation
- * @return {number} number of seconds since 01.01.1970
- */
- LUA_FUNCTION_DEF(util, get_time);
-
- /***
- * @function util.time_to_string(seconds)
- * Converts time from Unix time to HTTP date format
- * @param {number} seconds unix timestamp
- * @return {string} date as HTTP date
- */
- LUA_FUNCTION_DEF(util, time_to_string);
-
- /***
- * @function util.stat(fname)
- * Performs stat(2) on a specified filepath and returns table of values
- *
- * - `size`: size of file in bytes
- * - `type`: type of filepath: `regular`, `directory`, `special`
- * - `mtime`: modification time as unix time
- *
- * @return {string,table} error string (set when an error has occurred) followed by the table of values
- * @example
- *
- * local err,st = util.stat('/etc/passwd')
- *
- * if err then
- * -- handle error
- * else
- * print(st['size'])
- * end
- */
- LUA_FUNCTION_DEF(util, stat);
-
- /***
- * @function util.unlink(fname)
- * Removes the specified file from the filesystem
- *
- * @param {string} fname filename to remove
- * @return {boolean,[string]} true if file has been deleted or false,'error string'
- */
- LUA_FUNCTION_DEF(util, unlink);
-
- /***
- * @function util.lock_file(fname, [fd])
- * Lock the specified file. This function returns {number} which must be passed to `util.unlock_file` after usage
- * or you'll have a resource leak
- *
- * @param {string} fname filename to lock
- * @param {number} fd use the specified fd instead of opening one
- * @return {number|nil,string} number if locking was successful or nil + error otherwise
- */
- LUA_FUNCTION_DEF(util, lock_file);
-
- /***
- * @function util.unlock_file(fd, [close_fd])
- * Unlock the specified file closing the file descriptor associated.
- *
- * @param {number} fd descriptor to unlock
- * @param {boolean} close_fd close descriptor on unlocking (default: TRUE)
- * @return {boolean[,string]} true if a file was unlocked
- */
- LUA_FUNCTION_DEF(util, unlock_file);
-
- /***
- * @function util.create_file(fname, [mode])
- * Creates the specified file with the default mode 0644
- *
- * @param {string} fname filename to create
- * @param {number} mode open mode (you should use octal number here)
- * @return {number|nil,string} file descriptor or pair nil + error string
- */
- LUA_FUNCTION_DEF(util, create_file);
-
- /***
- * @function util.close_file(fd)
- * Closes descriptor fd
- *
- * @param {number} fd descriptor to close
- * @return {boolean[,string]} true if a file was closed
- */
- LUA_FUNCTION_DEF(util, close_file);
-
- /***
- * @function util.random_hex(size)
- * Returns random hex string of the specified size
- *
- * @param {number} size length of desired string in bytes
- * @return {string} string with random hex digits
- */
- LUA_FUNCTION_DEF(util, random_hex);
-
- /***
- * @function util.zstd_compress(data, [level=1])
- * Compresses input using zstd compression
- *
- * @param {string/rspamd_text} data input data
- * @param {number} level optional compression level (default: 1)
- * @return {rspamd_text} compressed data
- */
- LUA_FUNCTION_DEF(util, zstd_compress);
-
- /***
- * @function util.zstd_decompress(data)
- * Decompresses input using zstd algorithm
- *
- * @param {string/rspamd_text} data compressed data
- * @return {error,rspamd_text} pair of error + decompressed text
- */
- LUA_FUNCTION_DEF(util, zstd_decompress);
-
- /***
- * @function util.gzip_decompress(data, [size_limit])
- * Decompresses input using gzip algorithm
- *
- * @param {string/rspamd_text} data compressed data
- * @param {integer} size_limit optional size limit
- * @return {rspamd_text} decompressed text
- */
- LUA_FUNCTION_DEF(util, gzip_decompress);
-
- /***
- * @function util.inflate(data, [size_limit])
- * Decompresses input using inflate algorithm
- *
- * @param {string/rspamd_text} data compressed data
- * @param {integer} size_limit optional size limit
- * @return {rspamd_text} decompressed text
- */
- LUA_FUNCTION_DEF(util, inflate);
-
- /***
- * @function util.gzip_compress(data, [level=1])
- * Compresses input using gzip compression
- *
- * @param {string/rspamd_text} data input data
- * @param {number} level optional compression level (default: 1)
- * @return {rspamd_text} compressed data
- */
- LUA_FUNCTION_DEF(util, gzip_compress);
-
- /***
- * @function util.normalize_prob(prob, [bias = 0.5])
- * Normalize probabilities using a polynomial
- *
- * @param {number} prob probability param
- * @param {number} bias number to subtract for making the final solution
- * @return {number} normalized number
- */
- LUA_FUNCTION_DEF(util, normalize_prob);
- /***
- * @function util.is_utf_spoofed(str, [str2])
- * Returns true if a string is spoofed (possibly with another string `str2`)
- * @return {boolean} true if a string is spoofed
- */
- LUA_FUNCTION_DEF(util, is_utf_spoofed);
-
- /***
- * @function util.is_utf_mixed_script(str)
- * Returns true if a string contains mixed unicode scripts
- * @param {string} str string to check
- * @return {boolean} true if a string contains chars with mixed unicode script
- */
- LUA_FUNCTION_DEF(util, is_utf_mixed_script);
-
- /***
- * @function util.is_utf_outside_range(str, range_start, range_end)
- * Returns true if a string contains chars outside range
- * @param {string} str string to check
- * @param {number} range_start start of character range similar to uset_addRange
- * @param {number} range_end end of character range similar to uset_addRange
- * @return {boolean} true if a string contains chars outside selected utf range
- */
- LUA_FUNCTION_DEF(util, is_utf_outside_range);
-
- /***
- * @function util.get_string_stats(str)
- * Returns table with number of letters and digits in string
- * @return {table} with string stats keys are "digits" and "letters"
- */
- LUA_FUNCTION_DEF(util, get_string_stats);
-
- /***
- * @function util.is_valid_utf8(str)
- * Returns true if a string is valid UTF8 string
- * @return {boolean} true if a string is a valid UTF8 string
- */
- LUA_FUNCTION_DEF(util, is_valid_utf8);
-
- /***
- * @function util.has_obscured_unicode(str)
- * Returns true if a string has obscure UTF symbols (zero width spaces, order marks), ignores invalid utf characters
- * @return {boolean} true if a string has obscured unicode characters (+ character and offset if found)
- */
- LUA_FUNCTION_DEF(util, has_obscured_unicode);
-
- /***
- * @function util.readline([prompt])
- * Returns string read from stdin with history and editing support
- * @return {string} string read from the input (with line endings stripped)
- */
- LUA_FUNCTION_DEF(util, readline);
-
- /***
- * @function util.readpassphrase([prompt])
- * Returns string read from stdin disabling echo
- * @return {string} string read from the input (with line endings stripped)
- */
- LUA_FUNCTION_DEF(util, readpassphrase);
-
- /***
- * @function util.file_exists(file)
- * Checks if a specified file exists and is available for reading
- * @return {boolean,string} true if file exists + string error if not
- */
- LUA_FUNCTION_DEF(util, file_exists);
-
- /***
- * @function util.mkdir(dir[, recursive])
- * Creates a specified directory
- * @return {boolean[,error]} true if directory has been created
- */
- LUA_FUNCTION_DEF(util, mkdir);
-
- /***
- * @function util.umask(mask)
- * Sets new umask. Accepts either numeric octal string, e.g. '022' or a plain
- * number, e.g. 0x12 (since Lua does not support octal integer literals)
- * @return {number} old umask
- */
- LUA_FUNCTION_DEF(util, umask);
-
- /***
- * @function util.isatty()
- * Returns if stdout is a tty
- * @return {boolean} true in case of output being tty
- */
- LUA_FUNCTION_DEF(util, isatty);
-
- /***
- * @function util.pack(fmt, ...)
- *
- * Backport of Lua 5.3 `string.pack` function:
- * Returns a binary string containing the values v1, v2, etc. packed (that is,
- * serialized in binary form) according to the format string `fmt`
- * A format string is a sequence of conversion options. The conversion
- * options are as follows:
- *
- * * <: sets little endian
- * * >: sets big endian
- * * =: sets native endian
- * * ![n]: sets maximum alignment to n (default is native alignment)
- * * b: a signed byte (char)
- * * B: an unsigned byte (char)
- * * h: a signed short (native size)
- * * H: an unsigned short (native size)
- * * l: a signed long (native size)
- * * L: an unsigned long (native size)
- * * j: a lua_Integer
- * * J: a lua_Unsigned
- * * T: a size_t (native size)
- * * i[n]: a signed int with n bytes (default is native size)
- * * I[n]: an unsigned int with n bytes (default is native size)
- * * f: a float (native size)
- * * d: a double (native size)
- * * n: a lua_Number
- * * cn: a fixed-sized string with n bytes
- * * z: a zero-terminated string
- * * s[n]: a string preceded by its length coded as an unsigned integer with
- *   n bytes (default is a size_t)
- * * x: one byte of padding
- * * Xop: an empty item that aligns according to option op (which is otherwise ignored)
- * * ' ': (empty space) ignored
- *
- * (A "[n]" means an optional integral numeral.) Except for padding, spaces,
- * and configurations (options "xX <=>!"), each option corresponds to an
- * argument (in string.pack) or a result (in string.unpack).
- *
- * For options "!n", "sn", "in", and "In", n can be any integer between 1 and
- * 16. All integral options check overflows; string.pack checks whether the
- * given value fits in the given size; string.unpack checks whether the read
- * value fits in a Lua integer.
- *
- * Any format string starts as if prefixed by "!1=", that is, with maximum
- * alignment of 1 (no alignment) and native endianness.
- *
- * Alignment works as follows: For each option, the format gets extra padding
- * until the data starts at an offset that is a multiple of the minimum
- * between the option size and the maximum alignment; this minimum must be a
- * power of 2. Options "c" and "z" are not aligned; option "s" follows the
- * alignment of its starting integer.
- *
- * All padding is filled with zeros by string.pack (and ignored by unpack).
- */
- LUA_FUNCTION_DEF(util, pack);
-
- /***
- * @function util.packsize(fmt)
- *
- * Returns size of the packed binary string returned for the same `fmt` argument
- * by @see util.pack
- */
- LUA_FUNCTION_DEF(util, packsize);
-
- /***
- * @function util.unpack(fmt, s [, pos])
- * Unpacks string `s` according to the format string `fmt` as described in
- * @see util.pack
- *
- * @returns {multiple} list of unpacked values according to `fmt`
- */
- LUA_FUNCTION_DEF(util, unpack);
-
- /***
- * @function util.caseless_hash(str[, seed])
- * Calculates caseless non-crypto hash from a string or rspamd text
- * @param str string or lua_text
- * @param seed optional seed (0xdeadbabe by default)
- * @return {int64} boxed int64_t
- */
- LUA_FUNCTION_DEF(util, caseless_hash);
-
- /***
- * @function util.caseless_hash_fast(str[, seed])
- * Calculates caseless non-crypto hash from a string or rspamd text
- * @param str string or lua_text
- * @param seed optional seed (0xdeadbabe by default)
- * @return {number} number from int64_t
- */
- LUA_FUNCTION_DEF(util, caseless_hash_fast);
-
- /***
- * @function util.get_hostname()
- * Returns hostname for this machine
- * @return {string} hostname
- */
- LUA_FUNCTION_DEF(util, get_hostname);
-
- /***
- * @function util.parse_content_type(ct_string, mempool)
- * Parses content-type string to a table:
- * - `type`
- * - `subtype`
- * - `charset`
- * - `boundary`
- * - other attributes
- *
- * @param {string} ct_string content type as string
- * @param {rspamd_mempool} mempool needed to store temporary data (e.g. task pool)
- * @return table or nil if cannot parse content type
- */
- LUA_FUNCTION_DEF(util, parse_content_type);
-
- /***
- * @function util.mime_header_encode(hdr)
- * Encodes header if needed
- * @param {string} hdr input header
- * @return encoded header
- */
- LUA_FUNCTION_DEF(util, mime_header_encode);
-
- /***
- * @function util.btc_polymod(input_values)
- * Performs bitcoin polymod function
- * @param {table|numbers} input_values
- * @return {boolean} true if polymod has been successful
- */
- LUA_FUNCTION_DEF(util, btc_polymod);
-
- /***
- * @function util.parse_smtp_date(str[, local_tz])
- * Converts an SMTP date string to unix timestamp
- * @param {string} str input string
- * @param {boolean} local_tz convert to local tz if `true`
- * @return {number} time as unix timestamp (converted to float)
- */
- LUA_FUNCTION_DEF(util, parse_smtp_date);
-
-
- static const struct luaL_reg utillib_f[] = {
- LUA_INTERFACE_DEF(util, create_event_base),
- LUA_INTERFACE_DEF(util, load_rspamd_config),
- LUA_INTERFACE_DEF(util, config_from_ucl),
- LUA_INTERFACE_DEF(util, process_message),
- LUA_INTERFACE_DEF(util, encode_base64),
- LUA_INTERFACE_DEF(util, encode_qp),
- LUA_INTERFACE_DEF(util, decode_qp),
- LUA_INTERFACE_DEF(util, decode_base64),
- LUA_INTERFACE_DEF(util, encode_base32),
- LUA_INTERFACE_DEF(util, decode_base32),
- LUA_INTERFACE_DEF(util, decode_url),
- LUA_INTERFACE_DEF(util, tokenize_text),
- LUA_INTERFACE_DEF(util, tanh),
- LUA_INTERFACE_DEF(util, parse_html),
- LUA_INTERFACE_DEF(util, levenshtein_distance),
- LUA_INTERFACE_DEF(util, fold_header),
- LUA_INTERFACE_DEF(util, is_uppercase),
- LUA_INTERFACE_DEF(util, humanize_number),
- LUA_INTERFACE_DEF(util, get_tld),
- LUA_INTERFACE_DEF(util, glob),
- {"parse_addr", lua_util_parse_mail_address},
- LUA_INTERFACE_DEF(util, parse_mail_address),
- LUA_INTERFACE_DEF(util, strlen_utf8),
- LUA_INTERFACE_DEF(util, lower_utf8),
- LUA_INTERFACE_DEF(util, normalize_utf8),
- LUA_INTERFACE_DEF(util, transliterate),
- LUA_INTERFACE_DEF(util, strequal_caseless),
- LUA_INTERFACE_DEF(util, strequal_caseless_utf8),
- LUA_INTERFACE_DEF(util, get_ticks),
- LUA_INTERFACE_DEF(util, get_time),
- LUA_INTERFACE_DEF(util, time_to_string),
- LUA_INTERFACE_DEF(util, stat),
- LUA_INTERFACE_DEF(util, unlink),
- LUA_INTERFACE_DEF(util, lock_file),
- LUA_INTERFACE_DEF(util, unlock_file),
- LUA_INTERFACE_DEF(util, create_file),
- LUA_INTERFACE_DEF(util, close_file),
- LUA_INTERFACE_DEF(util, random_hex),
- LUA_INTERFACE_DEF(util, zstd_compress),
- LUA_INTERFACE_DEF(util, zstd_decompress),
- LUA_INTERFACE_DEF(util, gzip_compress),
- LUA_INTERFACE_DEF(util, gzip_decompress),
- LUA_INTERFACE_DEF(util, inflate),
- LUA_INTERFACE_DEF(util, normalize_prob),
- LUA_INTERFACE_DEF(util, caseless_hash),
- LUA_INTERFACE_DEF(util, caseless_hash_fast),
- LUA_INTERFACE_DEF(util, is_utf_spoofed),
- LUA_INTERFACE_DEF(util, is_utf_mixed_script),
- LUA_INTERFACE_DEF(util, is_utf_outside_range),
- LUA_INTERFACE_DEF(util, get_string_stats),
- LUA_INTERFACE_DEF(util, is_valid_utf8),
- LUA_INTERFACE_DEF(util, has_obscured_unicode),
- LUA_INTERFACE_DEF(util, readline),
- LUA_INTERFACE_DEF(util, readpassphrase),
- LUA_INTERFACE_DEF(util, file_exists),
- LUA_INTERFACE_DEF(util, mkdir),
- LUA_INTERFACE_DEF(util, umask),
- LUA_INTERFACE_DEF(util, isatty),
- LUA_INTERFACE_DEF(util, get_hostname),
- LUA_INTERFACE_DEF(util, parse_content_type),
- LUA_INTERFACE_DEF(util, mime_header_encode),
- LUA_INTERFACE_DEF(util, pack),
- LUA_INTERFACE_DEF(util, unpack),
- LUA_INTERFACE_DEF(util, packsize),
- LUA_INTERFACE_DEF(util, btc_polymod),
- LUA_INTERFACE_DEF(util, parse_smtp_date),
- {NULL, NULL}};
-
- LUA_FUNCTION_DEF(int64, tostring);
- LUA_FUNCTION_DEF(int64, fromstring);
- LUA_FUNCTION_DEF(int64, tonumber);
- LUA_FUNCTION_DEF(int64, hex);
-
- static const struct luaL_reg int64lib_f[] = {
- LUA_INTERFACE_DEF(int64, fromstring),
- {NULL, NULL}};
- static const struct luaL_reg int64lib_m[] = {
- LUA_INTERFACE_DEF(int64, tostring),
- LUA_INTERFACE_DEF(int64, tonumber),
- LUA_INTERFACE_DEF(int64, hex),
- {"__tostring", lua_int64_tostring},
- {NULL, NULL}};
-
- LUA_FUNCTION_DEF(ev_base, loop);
-
- static const struct luaL_reg ev_baselib_m[] = {
- LUA_INTERFACE_DEF(ev_base, loop),
- {"__tostring", rspamd_lua_class_tostring},
- {NULL, NULL}};
-
- static int64_t
- lua_check_int64(lua_State *L, int pos)
- {
- void *ud = rspamd_lua_check_udata(L, pos, rspamd_int64_classname);
- luaL_argcheck(L, ud != NULL, pos, "'int64' expected");
- return ud ? *((int64_t *) ud) : 0LL;
- }
-
-
- static int
- lua_util_create_event_base(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct ev_loop **pev_base;
-
- pev_base = lua_newuserdata(L, sizeof(struct ev_loop *));
- rspamd_lua_setclass(L, rspamd_ev_base_classname, -1);
- *pev_base = ev_loop_new(EVFLAG_SIGNALFD | EVBACKEND_ALL);
-
- return 1;
- }
-
- static int
- lua_util_load_rspamd_config(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_config *cfg, **pcfg;
- const char *cfg_name;
-
- cfg_name = luaL_checkstring(L, 1);
-
- if (cfg_name) {
- cfg = rspamd_config_new(RSPAMD_CONFIG_INIT_SKIP_LUA);
- cfg->lua_state = L;
-
- if (rspamd_config_read(cfg, cfg_name, NULL, NULL, NULL, FALSE, NULL)) {
- msg_err_config("cannot load config from %s", cfg_name);
- lua_pushnil(L);
- }
- else {
- rspamd_config_post_load(cfg, 0);
- pcfg = lua_newuserdata(L, sizeof(struct rspamd_config *));
- rspamd_lua_setclass(L, rspamd_config_classname, -1);
- *pcfg = cfg;
- }
- }
-
- return 1;
- }
-
- static int
- parse_config_options(const char *str_options)
- {
- int ret = 0;
- char **vec;
- const char *str;
- unsigned int i, l;
-
- vec = g_strsplit_set(str_options, ",;", -1);
- if (vec) {
- l = g_strv_length(vec);
- for (i = 0; i < l; i++) {
- str = vec[i];
-
- if (g_ascii_strcasecmp(str, "INIT_URL") == 0) {
- ret |= RSPAMD_CONFIG_INIT_URL;
- }
- else if (g_ascii_strcasecmp(str, "INIT_LIBS") == 0) {
- ret |= RSPAMD_CONFIG_INIT_LIBS;
- }
- else if (g_ascii_strcasecmp(str, "INIT_SYMCACHE") == 0) {
- ret |= RSPAMD_CONFIG_INIT_SYMCACHE;
- }
- else if (g_ascii_strcasecmp(str, "INIT_VALIDATE") == 0) {
- ret |= RSPAMD_CONFIG_INIT_VALIDATE;
- }
- else if (g_ascii_strcasecmp(str, "INIT_NO_TLD") == 0) {
- ret |= RSPAMD_CONFIG_INIT_NO_TLD;
- }
- else if (g_ascii_strcasecmp(str, "INIT_PRELOAD_MAPS") == 0) {
- ret |= RSPAMD_CONFIG_INIT_PRELOAD_MAPS;
- }
- else {
- msg_warn("bad type: %s", str);
- }
- }
-
- g_strfreev(vec);
- }
-
- return ret;
- }
-
- static int
- lua_util_config_from_ucl(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_config *cfg = NULL, **pcfg;
- struct rspamd_rcl_sections_map *top;
- GError *err = NULL;
- ucl_object_t *obj;
- const char *str_options = NULL;
- int int_options = 0;
-
-
- obj = ucl_object_lua_import(L, 1);
- if (lua_gettop(L) == 2) {
- if (lua_type(L, 2) == LUA_TSTRING) {
- str_options = lua_tostring(L, 2);
- int_options = parse_config_options(str_options);
- }
- else {
- msg_err("config_from_ucl: second parameter is expected to be string");
- ucl_object_unref(obj);
- lua_pushnil(L);
- }
- }
-
- if (obj) {
- cfg = rspamd_config_new(RSPAMD_CONFIG_INIT_SKIP_LUA);
- cfg->lua_state = L;
-
- cfg->cfg_ucl_obj = obj;
- top = rspamd_rcl_config_init(cfg, NULL);
-
- if (!rspamd_rcl_parse(top, cfg, cfg, cfg->cfg_pool, cfg->cfg_ucl_obj, &err)) {
- msg_err("rcl parse error: %s", err->message);
- ucl_object_unref(obj);
- lua_pushnil(L);
- }
- else {
-
- if (int_options & RSPAMD_CONFIG_INIT_LIBS) {
- cfg->libs_ctx = rspamd_init_libs();
- }
-
- rspamd_config_post_load(cfg, int_options);
- pcfg = lua_newuserdata(L, sizeof(struct rspamd_config *));
- rspamd_lua_setclass(L, rspamd_config_classname, -1);
- *pcfg = cfg;
- }
-
- rspamd_rcl_sections_free(top);
- }
-
- return 1;
- }
-
- static gboolean
- lua_util_task_fin(struct rspamd_task *task, void *ud)
- {
- ucl_object_t **target = ud;
-
- *target = rspamd_protocol_write_ucl(task, RSPAMD_PROTOCOL_DEFAULT);
- rdns_resolver_release(task->resolver->r);
-
- return TRUE;
- }
-
- static int
- lua_util_process_message(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_config *cfg = lua_check_config(L, 1);
- const char *message;
- gsize mlen;
- struct rspamd_task *task;
- struct ev_loop *base;
- ucl_object_t *res = NULL;
-
- message = luaL_checklstring(L, 2, &mlen);
-
- if (cfg != NULL && message != NULL) {
- base = ev_loop_new(EVFLAG_SIGNALFD | EVBACKEND_ALL);
- rspamd_init_filters(cfg, false, false);
- task = rspamd_task_new(NULL, cfg, NULL, NULL, base, FALSE);
- task->msg.begin = rspamd_mempool_alloc(task->task_pool, mlen);
- rspamd_strlcpy((gpointer) task->msg.begin, message, mlen);
- task->msg.len = mlen;
- task->fin_callback = lua_util_task_fin;
- task->fin_arg = &res;
- task->resolver = rspamd_dns_resolver_init(NULL, base, cfg);
- task->s = rspamd_session_create(task->task_pool, rspamd_task_fin,
- NULL, (event_finalizer_t) rspamd_task_free, task);
-
- if (!rspamd_task_load_message(task, NULL, message, mlen)) {
- lua_pushnil(L);
- }
- else {
- if (rspamd_task_process(task, RSPAMD_TASK_PROCESS_ALL)) {
- ev_loop(base, 0);
-
- if (res != NULL) {
- ucl_object_push_lua(L, res, true);
-
- ucl_object_unref(res);
- }
- else {
- ucl_object_push_lua(L,
- rspamd_protocol_write_ucl(task, RSPAMD_PROTOCOL_DEFAULT),
- true);
- rdns_resolver_release(task->resolver->r);
- rspamd_session_destroy(task->s);
- }
- }
- else {
- lua_pushnil(L);
- }
- }
-
- ev_loop_destroy(base);
- }
- else {
- lua_pushnil(L);
- }
-
- return 1;
- }
-
- static int
- lua_util_encode_base64(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t;
- char *out;
- gsize outlen;
- long str_lim = 0;
- gboolean fold = FALSE;
-
- t = lua_check_text_or_string(L, 1);
-
- if (lua_gettop(L) > 1) {
- str_lim = luaL_checkinteger(L, 2);
- fold = str_lim > 0;
- }
-
- if (t == NULL) {
- return luaL_error(L, "invalid arguments");
- }
- else {
-
- if (fold) {
- out = rspamd_encode_base64(t->start, t->len, str_lim, &outlen);
- }
- else {
- enum rspamd_newlines_type how = RSPAMD_TASK_NEWLINES_CRLF;
-
- if (lua_type(L, 3) == LUA_TSTRING) {
- const char *how_str = lua_tostring(L, 3);
-
- if (g_ascii_strcasecmp(how_str, "cr") == 0) {
- how = RSPAMD_TASK_NEWLINES_CR;
- }
- else if (g_ascii_strcasecmp(how_str, "lf") == 0) {
- how = RSPAMD_TASK_NEWLINES_LF;
- }
- else if (g_ascii_strcasecmp(how_str, "crlf") != 0) {
- return luaL_error(L, "invalid newline style: %s", how_str);
- }
- }
-
- out = rspamd_encode_base64_fold(t->start, t->len, str_lim, &outlen, how);
- }
-
- if (out != NULL) {
- lua_new_text(L, out, outlen, TRUE);
- }
- else {
- lua_pushnil(L);
- }
- }
-
- return 1;
- }
-
- static int
- lua_util_encode_qp(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t;
- const char *s = NULL;
- char *out;
- gsize inlen, outlen;
- unsigned int str_lim = 0;
-
- if (lua_type(L, 1) == LUA_TSTRING) {
- s = luaL_checklstring(L, 1, &inlen);
- }
- else if (lua_type(L, 1) == LUA_TUSERDATA) {
- t = lua_check_text(L, 1);
-
- if (t != NULL) {
- s = t->start;
- inlen = t->len;
- }
- }
-
- if (lua_gettop(L) > 1) {
- str_lim = luaL_checknumber(L, 2);
- }
-
- if (s == NULL) {
- lua_pushnil(L);
- }
- else {
- enum rspamd_newlines_type how = RSPAMD_TASK_NEWLINES_CRLF;
-
- if (lua_type(L, 3) == LUA_TSTRING) {
- const char *how_str = lua_tostring(L, 3);
-
- if (g_ascii_strcasecmp(how_str, "cr") == 0) {
- how = RSPAMD_TASK_NEWLINES_CR;
- }
- else if (g_ascii_strcasecmp(how_str, "lf") == 0) {
- how = RSPAMD_TASK_NEWLINES_LF;
- }
- else if (g_ascii_strcasecmp(how_str, "crlf") != 0) {
- return luaL_error(L, "invalid newline style: %s", how_str);
- }
- }
-
- out = rspamd_encode_qp_fold(s, inlen, str_lim, &outlen, how);
-
- if (out != NULL) {
- t = lua_newuserdata(L, sizeof(*t));
- rspamd_lua_setclass(L, rspamd_text_classname, -1);
- t->start = out;
- t->len = outlen;
- /* Need destruction */
- t->flags = RSPAMD_TEXT_FLAG_OWN;
- }
- else {
- lua_pushnil(L);
- }
- }
-
- return 1;
- }
-
- static int
- lua_util_decode_qp(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t, *out;
- const char *s = NULL;
- gsize inlen = 0;
- gssize outlen;
-
- if (lua_type(L, 1) == LUA_TSTRING) {
- s = luaL_checklstring(L, 1, &inlen);
- }
- else if (lua_type(L, 1) == LUA_TUSERDATA) {
- t = lua_check_text(L, 1);
-
- if (t != NULL) {
- s = t->start;
- inlen = t->len;
- }
- }
-
- if (s == NULL) {
- lua_pushnil(L);
- }
- else {
- out = lua_newuserdata(L, sizeof(*t));
- rspamd_lua_setclass(L, rspamd_text_classname, -1);
- out->start = g_malloc(inlen + 1);
- out->flags = RSPAMD_TEXT_FLAG_OWN;
- outlen = rspamd_decode_qp_buf(s, inlen, (char *) out->start, inlen + 1);
-
- if (outlen > 0) {
- out->len = outlen;
- }
- else {
- /*
- * It removes out and frees memory on gc due to RSPAMD_TEXT_FLAG_OWN
- */
- lua_pop(L, 1);
- lua_pushnil(L);
- }
- }
-
- return 1;
- }
-
- static int
- lua_util_decode_base64(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t;
- const char *s = NULL;
- gsize inlen = 0, outlen;
-
- if (lua_type(L, 1) == LUA_TSTRING) {
- s = luaL_checklstring(L, 1, &inlen);
- }
- else if (lua_type(L, 1) == LUA_TUSERDATA) {
- t = lua_check_text(L, 1);
-
- if (t != NULL) {
- s = t->start;
- inlen = t->len;
- }
- }
-
- if (s != NULL) {
- t = lua_newuserdata(L, sizeof(*t));
- rspamd_lua_setclass(L, rspamd_text_classname, -1);
- t->len = (inlen / 4) * 3 + 3;
- t->start = g_malloc(t->len);
-
- rspamd_cryptobox_base64_decode(s, inlen, (unsigned char *) t->start,
- &outlen);
- t->len = outlen;
- t->flags = RSPAMD_TEXT_FLAG_OWN;
- }
- else {
- lua_pushnil(L);
- }
-
- return 1;
- }
-
- static int
- lua_util_encode_base32(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t;
- const char *s = NULL;
- char *out;
- enum rspamd_base32_type btype = RSPAMD_BASE32_DEFAULT;
- gsize inlen, outlen;
-
- if (lua_type(L, 1) == LUA_TSTRING) {
- s = luaL_checklstring(L, 1, &inlen);
- }
- else if (lua_type(L, 1) == LUA_TUSERDATA) {
- t = lua_check_text(L, 1);
-
- if (t != NULL) {
- s = t->start;
- inlen = t->len;
- }
- }
-
- if (lua_type(L, 2) == LUA_TSTRING) {
- btype = rspamd_base32_decode_type_from_str(lua_tostring(L, 2));
-
- if (btype == RSPAMD_BASE32_INVALID) {
- return luaL_error(L, "invalid b32 type: %s", lua_tostring(L, 2));
- }
- }
-
- if (s == NULL) {
- return luaL_error(L, "invalid arguments");
- }
- else {
- out = rspamd_encode_base32(s, inlen, btype);
-
- if (out != NULL) {
- t = lua_newuserdata(L, sizeof(*t));
- outlen = strlen(out);
- rspamd_lua_setclass(L, rspamd_text_classname, -1);
- t->start = out;
- t->len = outlen;
- /* Need destruction */
- t->flags = RSPAMD_TEXT_FLAG_OWN;
- }
- else {
- lua_pushnil(L);
- }
- }
-
- return 1;
- }
-
- static int
- lua_util_decode_base32(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t;
- const char *s = NULL;
- gsize inlen, outlen;
- enum rspamd_base32_type btype = RSPAMD_BASE32_DEFAULT;
-
- if (lua_type(L, 1) == LUA_TSTRING) {
- s = luaL_checklstring(L, 1, &inlen);
- }
- else if (lua_type(L, 1) == LUA_TUSERDATA) {
- t = lua_check_text(L, 1);
-
- if (t != NULL) {
- s = t->start;
- inlen = t->len;
- }
- }
-
- if (lua_type(L, 2) == LUA_TSTRING) {
- btype = rspamd_base32_decode_type_from_str(lua_tostring(L, 2));
-
- if (btype == RSPAMD_BASE32_INVALID) {
- return luaL_error(L, "invalid b32 type: %s", lua_tostring(L, 2));
- }
- }
-
- if (s != NULL) {
- unsigned char *decoded;
-
- decoded = rspamd_decode_base32(s, inlen, &outlen, btype);
-
- if (decoded) {
- t = lua_newuserdata(L, sizeof(*t));
- rspamd_lua_setclass(L, rspamd_text_classname, -1);
- t->start = (const char *) decoded;
- t->len = outlen;
- t->flags = RSPAMD_TEXT_FLAG_OWN;
- }
- else {
- lua_pushnil(L);
- }
- }
- else {
- lua_pushnil(L);
- }
-
- return 1;
- }
-
- static int
- lua_util_decode_url(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t;
-
- t = lua_check_text_or_string(L, 1);
-
- if (t != NULL) {
- struct rspamd_lua_text *out = lua_new_text(L, NULL, t->len, TRUE);
-
- out->len = rspamd_url_decode((char *) out->start, t->start, t->len);
- }
- else {
- lua_pushnil(L);
- }
-
- return 1;
- }
-
-
- static int
- lua_util_tokenize_text(lua_State *L)
- {
- return lua_parsers_tokenize_text(L);
- }
-
- static int
- lua_util_tanh(lua_State *L)
- {
- LUA_TRACE_POINT;
- double in = luaL_checknumber(L, 1);
-
- lua_pushnumber(L, tanh(in));
-
- return 1;
- }
-
- static int
- lua_util_parse_html(lua_State *L)
- {
- return lua_parsers_parse_html(L);
- }
-
- static int
- lua_util_levenshtein_distance(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t1, *t2;
- int dist = 0;
- unsigned int replace_cost = 1;
-
- t1 = lua_check_text_or_string(L, 1);
- t2 = lua_check_text_or_string(L, 2);
- if (lua_isnumber(L, 3)) {
- replace_cost = lua_tointeger(L, 3);
- }
-
- if (t1 && t2) {
- dist = rspamd_strings_levenshtein_distance(t1->start, t1->len, t2->start, t2->len,
- replace_cost);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- lua_pushinteger(L, dist);
-
- return 1;
- }
-
- static int
- lua_util_fold_header(lua_State *L)
- {
- LUA_TRACE_POINT;
- const char *how, *stop_chars = NULL;
- struct rspamd_lua_text *name, *value;
- GString *folded;
-
- name = lua_check_text_or_string(L, 1);
- value = lua_check_text_or_string(L, 2);
-
- if (name && value) {
-
- if (lua_isstring(L, 3)) {
-
- how = lua_tostring(L, 3);
-
- if (lua_isstring(L, 4)) {
- stop_chars = lua_tostring(L, 4);
- }
-
- if (strcmp(how, "cr") == 0) {
- folded = rspamd_header_value_fold(name->start, name->len,
- value->start, value->len,
- 0,
- RSPAMD_TASK_NEWLINES_CR, stop_chars);
- }
- else if (strcmp(how, "lf") == 0) {
- folded = rspamd_header_value_fold(name->start, name->len,
- value->start, value->len, 0,
- RSPAMD_TASK_NEWLINES_LF, stop_chars);
- }
- else {
- folded = rspamd_header_value_fold(name->start, name->len,
- value->start, value->len, 0,
- RSPAMD_TASK_NEWLINES_CRLF, stop_chars);
- }
- }
- else {
- folded = rspamd_header_value_fold(name->start, name->len,
- value->start, value->len, 0,
- RSPAMD_TASK_NEWLINES_CRLF, stop_chars);
- }
-
- if (folded) {
- lua_pushlstring(L, folded->str, folded->len);
- g_string_free(folded, TRUE);
-
- return 1;
- }
- }
-
- lua_pushnil(L);
- return 1;
- }
-
- static int
- lua_util_is_uppercase(lua_State *L)
- {
- LUA_TRACE_POINT;
- int32_t i = 0;
- UChar32 uc;
- bool is_upper = false, is_lower = false, is_other = false;
-
- struct rspamd_lua_text *t = lua_check_text_or_string(L, 1);
- if (t) {
- while (i >= 0 && i < t->len) {
- U8_NEXT(t->start, i, t->len, uc);
-
- if (uc < 0) {
- break;
- }
-
- if (u_isupper(uc)) {
- is_upper = true;
- }
- else if (u_islower(uc)) {
- is_lower = true;
- break;
- }
- else if (u_charType(uc) == U_OTHER_LETTER) {
- is_other = true;
- break;
- }
- }
- }
-
- if (is_upper && !is_lower && !is_other) {
- lua_pushboolean(L, TRUE);
- }
- else {
- lua_pushboolean(L, FALSE);
- }
-
- return 1;
- }
-
- static int
- lua_util_humanize_number(lua_State *L)
- {
- LUA_TRACE_POINT;
- int64_t number = luaL_checkinteger(L, 1);
- char numbuf[32];
-
-
- rspamd_snprintf(numbuf, sizeof(numbuf), "%hL", number);
- lua_pushstring(L, numbuf);
-
- return 1;
- }
-
- static int
- lua_util_get_tld(lua_State *L)
- {
- LUA_TRACE_POINT;
- const char *host;
- gsize hostlen;
- rspamd_ftok_t tld;
-
- host = luaL_checklstring(L, 1, &hostlen);
-
- if (host) {
- if (!rspamd_url_find_tld(host, hostlen, &tld)) {
- lua_pushlstring(L, host, hostlen);
- }
- else {
- lua_pushlstring(L, tld.begin, tld.len);
- }
- }
- else {
- lua_pushnil(L);
- }
-
- return 1;
- }
-
-
- static int
- lua_util_glob(lua_State *L)
- {
- LUA_TRACE_POINT;
- const char *pattern;
- glob_t gl;
- int top, i, flags = 0;
-
- top = lua_gettop(L);
- memset(&gl, 0, sizeof(gl));
-
- for (i = 1; i <= top; i++, flags |= GLOB_APPEND) {
- pattern = luaL_checkstring(L, i);
-
- if (pattern) {
- if (glob(pattern, flags, NULL, &gl) != 0) {
- /* There is no way to return error here, so just create an table */
- lua_createtable(L, 0, 0);
- globfree(&gl);
-
- return 1;
- }
- }
- }
-
- lua_createtable(L, gl.gl_pathc, 0);
- /* Push results */
- for (i = 0; i < (int) gl.gl_pathc; i++) {
- lua_pushstring(L, gl.gl_pathv[i]);
- lua_rawseti(L, -2, i + 1);
- }
-
- globfree(&gl);
-
- return 1;
- }
-
- static int
- lua_util_parse_mail_address(lua_State *L)
- {
- return lua_parsers_parse_mail_address(L);
- }
-
- static int
- lua_util_strlen_utf8(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t;
-
- t = lua_check_text_or_string(L, 1);
-
- if (t) {
- int32_t i = 0, nchars = 0;
- UChar32 uc;
-
- while (i < t->len) {
- U8_NEXT((uint8_t *) t->start, i, t->len, uc);
- nchars++;
- }
-
- lua_pushinteger(L, nchars);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 1;
- }
-
- static int
- lua_util_lower_utf8(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t;
-
- char *dst;
- UChar32 uc;
- UBool err = 0;
- int32_t i = 0, j = 0;
-
- t = lua_check_text_or_string(L, 1);
-
- if (t) {
- dst = g_malloc(t->len);
-
- while (i < t->len && err == 0) {
- U8_NEXT((uint8_t *) t->start, i, t->len, uc);
- uc = u_tolower(uc);
- U8_APPEND(dst, j, t->len, uc, err);
- }
-
- if (lua_isstring(L, 1)) {
- lua_pushlstring(L, dst, j);
- g_free(dst);
- }
- else {
- t = lua_new_text(L, dst, j, FALSE);
- /* We have actually allocated text data before */
- t->flags |= RSPAMD_TEXT_FLAG_OWN;
- }
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 1;
- }
-
- static int
- lua_util_normalize_utf8(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t;
- bool is_text = lua_type(L, 1) == LUA_TUSERDATA;
-
- t = lua_check_text_or_string(L, 1);
-
- if (!t) {
- return luaL_error(L, "invalid arguments");
- }
-
- char *cpy = g_malloc(t->len + 1);
- memcpy(cpy, t->start, t->len);
- cpy[t->len] = '\0';
- gsize len = t->len;
- enum rspamd_utf8_normalise_result res = rspamd_normalise_unicode_inplace(cpy, &len);
-
- if (is_text) {
- struct rspamd_lua_text *out = lua_new_text(L, cpy, len, FALSE);
- out->flags |= RSPAMD_TEXT_FLAG_OWN;
- }
- else {
- lua_pushlstring(L, cpy, len);
- g_free(cpy);
- }
-
- lua_pushinteger(L, res);
-
- return 2;
- }
-
- static int
- lua_util_transliterate(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t;
- t = lua_check_text_or_string(L, 1);
-
- if (!t) {
- return luaL_error(L, "invalid arguments");
- }
-
- gsize outlen;
- char *transliterated = rspamd_utf8_transliterate(t->start, t->len, &outlen);
- lua_new_text(L, transliterated, outlen, TRUE);
-
- return 1;
- }
-
- static int
- lua_util_strequal_caseless(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t1, *t2;
- int ret = -1;
-
- t1 = lua_check_text_or_string(L, 1);
- t2 = lua_check_text_or_string(L, 2);
-
- if (t1 && t2) {
-
- if (t1->len == t2->len) {
- ret = rspamd_lc_cmp(t1->start, t2->start, t1->len);
- }
- else {
- ret = t1->len - t2->len;
- }
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- lua_pushboolean(L, (ret == 0) ? true : false);
- return 1;
- }
-
- static int
- lua_util_strequal_caseless_utf8(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t1, *t2;
- int ret = -1;
-
- t1 = lua_check_text_or_string(L, 1);
- t2 = lua_check_text_or_string(L, 2);
-
- if (t1 && t2) {
- ret = rspamd_utf8_strcmp_sizes(t1->start, t1->len, t2->start, t2->len);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- lua_pushboolean(L, (ret == 0) ? true : false);
-
- return 1;
- }
-
- static int
- lua_util_get_ticks(lua_State *L)
- {
- LUA_TRACE_POINT;
- double ticks;
- gboolean rdtsc = FALSE;
-
- if (lua_isboolean(L, 1)) {
- rdtsc = lua_toboolean(L, 1);
- }
-
- ticks = rspamd_get_ticks(rdtsc);
- lua_pushnumber(L, ticks);
-
- return 1;
- }
-
- static int
- lua_util_get_time(lua_State *L)
- {
- LUA_TRACE_POINT;
-
- lua_pushnumber(L, ev_time());
-
- return 1;
- }
-
- static int
- lua_util_time_to_string(lua_State *L)
- {
- LUA_TRACE_POINT;
- double seconds;
- char timebuf[128];
-
- if (lua_isnumber(L, 1)) {
- seconds = lua_tonumber(L, 1);
- }
- else {
- seconds = ev_time();
- }
-
- rspamd_http_date_format(timebuf, sizeof(timebuf), seconds);
- lua_pushstring(L, timebuf);
-
- return 1;
- }
-
- static int
- lua_util_stat(lua_State *L)
- {
- LUA_TRACE_POINT;
- const char *fpath;
- struct stat st;
-
- fpath = luaL_checkstring(L, 1);
-
- if (fpath) {
- if (stat(fpath, &st) == -1) {
- lua_pushstring(L, strerror(errno));
- lua_pushnil(L);
- }
- else {
- lua_pushnil(L);
- lua_createtable(L, 0, 3);
-
- lua_pushstring(L, "size");
- lua_pushinteger(L, st.st_size);
- lua_settable(L, -3);
-
- lua_pushstring(L, "mtime");
- lua_pushinteger(L, st.st_mtime);
- lua_settable(L, -3);
-
- lua_pushstring(L, "type");
- if (S_ISREG(st.st_mode)) {
- lua_pushstring(L, "regular");
- }
- else if (S_ISDIR(st.st_mode)) {
- lua_pushstring(L, "directory");
- }
- else {
- lua_pushstring(L, "special");
- }
- lua_settable(L, -3);
- }
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 2;
- }
-
- static int
- lua_util_unlink(lua_State *L)
- {
- LUA_TRACE_POINT;
- const char *fpath;
- int ret;
-
- fpath = luaL_checkstring(L, 1);
-
- if (fpath) {
- ret = unlink(fpath);
-
- if (ret == -1) {
- lua_pushboolean(L, false);
- lua_pushstring(L, strerror(errno));
-
- return 2;
- }
-
- lua_pushboolean(L, true);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 1;
- }
-
- static int
- lua_util_lock_file(lua_State *L)
- {
- LUA_TRACE_POINT;
- const char *fpath;
- int fd = -1;
- gboolean own = FALSE;
-
- #if !HAVE_FLOCK
- struct flock fl = {
- .l_type = F_WRLCK,
- .l_whence = SEEK_SET,
- .l_start = 0,
- .l_len = 0};
- #endif
-
- fpath = luaL_checkstring(L, 1);
-
- if (fpath) {
- if (lua_isnumber(L, 2)) {
- fd = lua_tointeger(L, 2);
- }
- else {
- fd = open(fpath, O_RDONLY);
- own = TRUE;
- }
-
- if (fd == -1) {
- lua_pushnil(L);
- lua_pushstring(L, strerror(errno));
-
- return 2;
- }
-
- #if HAVE_FLOCK
- if (flock(fd, LOCK_EX) == -1) {
- #else
- if (fcntl(fd, F_SETLKW, &fl) == -1) {
- #endif
- lua_pushnil(L);
- lua_pushstring(L, strerror(errno));
-
- if (own) {
- close(fd);
- }
-
- return 2;
- }
-
- lua_pushinteger(L, fd);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 1;
- }
-
- static int
- lua_util_unlock_file(lua_State *L)
- {
- LUA_TRACE_POINT;
- int fd = -1, ret, serrno;
- gboolean do_close = TRUE;
-
- #if !HAVE_FLOCK
- struct flock fl = {
- .l_type = F_UNLCK,
- .l_whence = SEEK_SET,
- .l_start = 0,
- .l_len = 0};
- #endif
-
- if (lua_isnumber(L, 1)) {
- fd = lua_tointeger(L, 1);
-
- if (lua_isboolean(L, 2)) {
- do_close = lua_toboolean(L, 2);
- }
-
- #if HAVE_FLOCK
- ret = flock(fd, LOCK_UN);
- #else
- ret = fcntl(fd, F_SETLKW, &fl);
- #endif
-
- if (do_close) {
- serrno = errno;
- close(fd);
- errno = serrno;
- }
-
- if (ret == -1) {
- lua_pushboolean(L, false);
- lua_pushstring(L, strerror(errno));
-
- return 2;
- }
-
- lua_pushboolean(L, true);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 1;
- }
-
- static int
- lua_util_create_file(lua_State *L)
- {
- LUA_TRACE_POINT;
- int fd, mode = 00644;
- const char *fpath;
-
- fpath = luaL_checkstring(L, 1);
-
- if (fpath) {
- if (lua_isnumber(L, 2)) {
- mode = lua_tointeger(L, 2);
- }
-
- fd = rspamd_file_xopen(fpath, O_RDWR | O_CREAT | O_TRUNC, mode, 0);
-
- if (fd == -1) {
- lua_pushnil(L);
- lua_pushstring(L, strerror(errno));
-
- return 2;
- }
-
- lua_pushinteger(L, fd);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 1;
- }
-
- static int
- lua_util_close_file(lua_State *L)
- {
- LUA_TRACE_POINT;
- int fd = -1;
-
- if (lua_isnumber(L, 1)) {
- fd = lua_tointeger(L, 1);
-
- if (close(fd) == -1) {
- lua_pushboolean(L, false);
- lua_pushstring(L, strerror(errno));
-
- return 2;
- }
-
- lua_pushboolean(L, true);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 1;
- }
-
- static int
- lua_util_random_hex(lua_State *L)
- {
- LUA_TRACE_POINT;
- char *buf;
- int buflen;
-
- buflen = lua_tointeger(L, 1);
-
- if (buflen <= 0) {
- return luaL_error(L, "invalid arguments");
- }
-
- buf = g_malloc(buflen);
- rspamd_random_hex(buf, buflen);
- lua_pushlstring(L, buf, buflen);
- g_free(buf);
-
- return 1;
- }
-
- static int
- lua_util_zstd_compress(lua_State *L)
- {
- return lua_compress_zstd_compress(L);
- }
-
- static int
- lua_util_zstd_decompress(lua_State *L)
- {
- return lua_compress_zstd_decompress(L);
- }
-
- static int
- lua_util_gzip_compress(lua_State *L)
- {
- return lua_compress_zlib_compress(L);
- }
-
- static int
- lua_util_gzip_decompress(lua_State *L)
- {
- return lua_compress_zlib_decompress(L, true);
- }
-
- static int
- lua_util_inflate(lua_State *L)
- {
- return lua_compress_zlib_decompress(L, false);
- }
-
- static int
- lua_util_normalize_prob(lua_State *L)
- {
- LUA_TRACE_POINT;
- double x, bias = 0.5;
-
- x = lua_tonumber(L, 1);
-
- if (lua_type(L, 2) == LUA_TNUMBER) {
- bias = lua_tonumber(L, 2);
- }
-
- lua_pushnumber(L, rspamd_normalize_probability(x, bias));
-
- return 1;
- }
-
- static int
- lua_util_caseless_hash(lua_State *L)
- {
- LUA_TRACE_POINT;
- uint64_t seed = 0xdeadbabe, h;
- struct rspamd_lua_text *t = NULL;
- int64_t *r;
-
- t = lua_check_text_or_string(L, 1);
-
- if (t == NULL || t->start == NULL) {
- return luaL_error(L, "invalid arguments");
- }
-
- if (lua_type(L, 2) == LUA_TNUMBER) {
- seed = lua_tointeger(L, 2);
- }
- else if (lua_type(L, 2) == LUA_TUSERDATA) {
- seed = lua_check_int64(L, 2);
- }
-
- h = rspamd_icase_hash(t->start, t->len, seed);
- r = lua_newuserdata(L, sizeof(*r));
- *r = h;
- rspamd_lua_setclass(L, rspamd_int64_classname, -1);
-
- return 1;
- }
-
- static int
- lua_util_caseless_hash_fast(lua_State *L)
- {
- LUA_TRACE_POINT;
- uint64_t seed = 0xdeadbabe, h;
- struct rspamd_lua_text *t = NULL;
- union {
- uint64_t i;
- double d;
- } u;
-
- t = lua_check_text_or_string(L, 1);
-
- if (t == NULL || t->start == NULL) {
- return luaL_error(L, "invalid arguments");
- }
-
- if (lua_type(L, 2) == LUA_TNUMBER) {
- seed = lua_tointeger(L, 2);
- }
- else if (lua_type(L, 2) == LUA_TUSERDATA) {
- seed = lua_check_int64(L, 2);
- }
-
- /*
- * Here, we loose entropy from 64 bits to 52 bits roughly, however,
- * it is still fine for practical applications
- */
-
- h = rspamd_icase_hash(t->start, t->len, seed);
- u.i = G_GUINT64_CONSTANT(0x3FF) << 52 | h >> 12;
- lua_pushnumber(L, u.d - 1.0);
-
- return 1;
- }
-
- static int
- lua_util_is_utf_spoofed(lua_State *L)
- {
- LUA_TRACE_POINT;
- gsize l1, l2;
- int ret, nres = 2;
- const char *s1 = lua_tolstring(L, 1, &l1),
- *s2 = lua_tolstring(L, 2, &l2);
- static USpoofChecker *spc, *spc_sgl;
- UErrorCode uc_err = U_ZERO_ERROR;
-
- if (s1 && s2) {
- if (spc == NULL) {
- spc = uspoof_open(&uc_err);
-
- if (uc_err != U_ZERO_ERROR) {
- msg_err("cannot init spoof checker: %s", u_errorName(uc_err));
- lua_pushboolean(L, false);
-
- return 1;
- }
- }
-
- ret = uspoof_areConfusableUTF8(spc, s1, l1, s2, l2, &uc_err);
- }
- else if (s1) {
- /* We have just s1, not s2 */
- if (spc_sgl == NULL) {
- spc_sgl = uspoof_open(&uc_err);
-
- if (uc_err != U_ZERO_ERROR) {
- msg_err("cannot init spoof checker: %s", u_errorName(uc_err));
- lua_pushboolean(L, false);
-
- return 1;
- }
-
- uspoof_setChecks(spc_sgl,
- USPOOF_INVISIBLE | USPOOF_MIXED_SCRIPT_CONFUSABLE | USPOOF_ANY_CASE,
- &uc_err);
- if (uc_err != U_ZERO_ERROR) {
- msg_err("Cannot set proper checks for uspoof: %s", u_errorName(uc_err));
- lua_pushboolean(L, false);
- uspoof_close(spc);
- return 1;
- }
- }
-
- ret = uspoof_checkUTF8(spc_sgl, s1, l1, NULL, &uc_err);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- lua_pushboolean(L, !!(ret != 0));
-
- switch (ret) {
- case 0:
- nres = 1;
- break;
- case USPOOF_SINGLE_SCRIPT_CONFUSABLE:
- lua_pushstring(L, "single");
- break;
- case USPOOF_MIXED_SCRIPT_CONFUSABLE:
- lua_pushstring(L, "multiple");
- break;
- case USPOOF_WHOLE_SCRIPT_CONFUSABLE:
- lua_pushstring(L, "whole");
- break;
- default:
- lua_pushstring(L, "unknown");
- break;
- }
-
- return nres;
- }
-
- static int
- lua_util_is_utf_mixed_script(lua_State *L)
- {
- LUA_TRACE_POINT;
- gsize len_of_string;
- const unsigned char *string_to_check = lua_tolstring(L, 1, &len_of_string);
- UScriptCode last_script_code = USCRIPT_INVALID_CODE;
- UErrorCode uc_err = U_ZERO_ERROR;
-
- if (string_to_check) {
- uint index = 0;
- UChar32 char_to_check = 0;
-
- while (index < len_of_string) {
- U8_NEXT(string_to_check, index, len_of_string, char_to_check);
-
- if (char_to_check < 0) {
- return luaL_error(L, "passed string is not valid utf");
- }
-
- UScriptCode current_script_code = uscript_getScript(char_to_check, &uc_err);
-
- if (uc_err != U_ZERO_ERROR) {
- msg_err("cannot get unicode script for character, error: %s",
- u_errorName(uc_err));
- lua_pushboolean(L, false);
-
- return 1;
- }
-
- if (current_script_code != USCRIPT_COMMON &&
- current_script_code != USCRIPT_INHERITED) {
-
- if (last_script_code == USCRIPT_INVALID_CODE) {
- last_script_code = current_script_code;
- }
- else {
- if (last_script_code != current_script_code) {
- lua_pushboolean(L, true);
-
- return 1;
- }
- }
- }
- }
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- lua_pushboolean(L, false);
-
- return 1;
- }
-
- static int
- lua_util_get_string_stats(lua_State *L)
- {
- LUA_TRACE_POINT;
- int num_of_digits = 0, num_of_letters = 0;
- struct rspamd_lua_text *t;
-
- t = lua_check_text_or_string(L, 1);
-
- if (t) {
- const char *p = t->start, *end = t->start + t->len;
- while (p < end) {
- if (g_ascii_isdigit(*p)) {
- num_of_digits++;
- }
- else if (g_ascii_isalpha(*p)) {
- num_of_letters++;
- }
- p++;
- }
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- lua_createtable(L, 0, 2);
- lua_pushstring(L, "digits");
- lua_pushinteger(L, num_of_digits);
- lua_settable(L, -3);
- lua_pushstring(L, "letters");
- lua_pushinteger(L, num_of_letters);
- lua_settable(L, -3);
-
- return 1;
- }
-
-
- static int
- lua_util_is_utf_outside_range(lua_State *L)
- {
- LUA_TRACE_POINT;
- int ret;
- struct rspamd_lua_text *t = lua_check_text_or_string(L, 1);
- uint32_t range_start = lua_tointeger(L, 2);
- uint32_t range_end = lua_tointeger(L, 3);
-
- static rspamd_lru_hash_t *validators;
-
- if (validators == NULL) {
- validators = rspamd_lru_hash_new_full(16, g_free, (GDestroyNotify) uspoof_close, g_int64_hash, g_int64_equal);
- }
-
- if (t) {
- uint64_t hash_key = (uint64_t) range_end << 32 || range_start;
-
- USpoofChecker *validator = rspamd_lru_hash_lookup(validators, &hash_key, 0);
-
- UErrorCode uc_err = U_ZERO_ERROR;
-
- if (validator == NULL) {
- USet *allowed_chars;
- uint64_t *creation_hash_key = g_malloc(sizeof(uint64_t));
- *creation_hash_key = hash_key;
-
- validator = uspoof_open(&uc_err);
- if (uc_err != U_ZERO_ERROR) {
- msg_err("cannot init spoof checker: %s", u_errorName(uc_err));
- lua_pushboolean(L, false);
- uspoof_close(validator);
- g_free(creation_hash_key);
- return 1;
- }
-
- allowed_chars = uset_openEmpty();
- uset_addRange(allowed_chars, range_start, range_end);
- uspoof_setAllowedChars(validator, allowed_chars, &uc_err);
-
- uspoof_setChecks(validator,
- USPOOF_CHAR_LIMIT | USPOOF_ANY_CASE, &uc_err);
-
- uset_close(allowed_chars);
-
- if (uc_err != U_ZERO_ERROR) {
- msg_err("Cannot configure uspoof: %s", u_errorName(uc_err));
- lua_pushboolean(L, false);
- uspoof_close(validator);
- g_free(creation_hash_key);
- return 1;
- }
-
- rspamd_lru_hash_insert(validators, creation_hash_key, validator,
- 0, 0);
- }
-
- int32_t pos = 0;
- ret = uspoof_checkUTF8(validator, t->start, t->len, &pos,
- &uc_err);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- lua_pushboolean(L, !!(ret != 0));
-
- return 1;
- }
-
-
- static int
- lua_util_get_hostname(lua_State *L)
- {
- LUA_TRACE_POINT;
- char *hostbuf;
- gsize hostlen;
-
- hostlen = sysconf(_SC_HOST_NAME_MAX);
-
- if (hostlen <= 0) {
- hostlen = 256;
- }
- else {
- hostlen++;
- }
-
- hostbuf = g_alloca(hostlen);
- memset(hostbuf, 0, hostlen);
- gethostname(hostbuf, hostlen - 1);
-
- lua_pushstring(L, hostbuf);
-
- return 1;
- }
-
- static int
- lua_util_parse_content_type(lua_State *L)
- {
- return lua_parsers_parse_content_type(L);
- }
-
-
- static int
- lua_util_mime_header_encode(lua_State *L)
- {
- LUA_TRACE_POINT;
- gsize len;
- const char *hdr = luaL_checklstring(L, 1, &len);
- char *encoded;
-
- if (!hdr) {
- return luaL_error(L, "invalid arguments");
- }
-
- encoded = rspamd_mime_header_encode(hdr, len);
- lua_pushstring(L, encoded);
- g_free(encoded);
-
- return 1;
- }
-
- static int
- lua_util_is_valid_utf8(lua_State *L)
- {
- LUA_TRACE_POINT;
- struct rspamd_lua_text *t = lua_check_text_or_string(L, 1);
-
- if (t) {
- goffset error_offset = rspamd_fast_utf8_validate(t->start, t->len);
-
- if (error_offset == 0) {
- lua_pushboolean(L, true);
- }
- else {
- lua_pushboolean(L, false);
- lua_pushinteger(L, error_offset);
-
- return 2;
- }
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 1;
- }
-
- static int
- lua_util_has_obscured_unicode(lua_State *L)
- {
- LUA_TRACE_POINT;
- int32_t i = 0, prev_i;
- UChar32 uc;
-
- struct rspamd_lua_text *t = lua_check_text_or_string(L, 1);
-
- while (i < t->len) {
- prev_i = i;
- U8_NEXT(t->start, i, t->len, uc);
-
- if (uc > 0) {
- if (IS_OBSCURED_CHAR(uc)) {
- lua_pushboolean(L, true);
- lua_pushinteger(L, uc); /* Character */
- lua_pushinteger(L, prev_i); /* Offset */
-
- return 3;
- }
- }
- }
-
- lua_pushboolean(L, false);
-
- return 1;
- }
-
- static int
- lua_util_readline(lua_State *L)
- {
- LUA_TRACE_POINT;
- const char *prompt = "";
- char *input = NULL;
-
- if (lua_type(L, 1) == LUA_TSTRING) {
- prompt = lua_tostring(L, 1);
- }
- #ifdef WITH_LUA_REPL
- static Replxx *rx_instance = NULL;
-
- if (rx_instance == NULL) {
- rx_instance = replxx_init();
- /* See https://github.com/AmokHuginnsson/replxx/issues/137 */
- replxx_history_add(rx_instance, "");
- }
-
- input = (char *) replxx_input(rx_instance, prompt);
-
- if (input) {
- lua_pushstring(L, input);
- }
- else {
- lua_pushnil(L);
- }
- #else
- size_t linecap = 0;
- ssize_t linelen;
-
- fprintf(stdout, "%s ", prompt);
-
- linelen = getline(&input, &linecap, stdin);
-
- if (linelen > 0) {
- if (input[linelen - 1] == '\n') {
- linelen--;
- }
-
- lua_pushlstring(L, input, linelen);
- free(input);
- }
- else {
- lua_pushnil(L);
- }
- #endif
-
- return 1;
- }
-
- static int
- lua_util_readpassphrase(lua_State *L)
- {
- LUA_TRACE_POINT;
- char test_password[8192];
- gsize r;
-
- r = rspamd_read_passphrase(test_password, sizeof(test_password), 0, NULL);
-
- if (r > 0) {
- lua_pushlstring(L, test_password, r);
- }
- else {
- lua_pushnil(L);
- }
-
- /* In fact, we still pass it to Lua which is not very safe */
- rspamd_explicit_memzero(test_password, sizeof(test_password));
-
- return 1;
- }
-
- static int
- lua_util_file_exists(lua_State *L)
- {
- LUA_TRACE_POINT;
- const char *fname = luaL_checkstring(L, 1);
- int serrno;
-
- if (fname) {
- if (access(fname, R_OK) == -1) {
- serrno = errno;
- lua_pushboolean(L, false);
- lua_pushstring(L, strerror(serrno));
- }
- else {
- lua_pushboolean(L, true);
- lua_pushnil(L);
- }
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 2;
- }
-
- static int
- lua_util_mkdir(lua_State *L)
- {
- LUA_TRACE_POINT;
- const char *dname = luaL_checkstring(L, 1);
- gboolean recursive = FALSE;
- int r = -1;
-
- if (dname) {
- if (lua_isboolean(L, 2)) {
- recursive = lua_toboolean(L, 2);
- }
-
- if (recursive) {
- char path[PATH_MAX];
- gsize len, i;
-
- len = rspamd_strlcpy(path, dname, sizeof(path));
-
- /* Strip last / */
- if (path[len - 1] == '/') {
- path[len - 1] = '\0';
- len--;
- }
-
- for (i = 1; i < len; i++) {
- if (path[i] == '/') {
- path[i] = '\0';
-
- errno = 0;
- r = mkdir(path, S_IRWXU | S_IRGRP | S_IXGRP | S_IROTH | S_IXOTH);
-
- if (r == -1 && errno != EEXIST) {
- break;
- }
-
- path[i] = '/';
- }
- }
-
- /* Final path component */
- r = mkdir(path, S_IRWXU | S_IRGRP | S_IXGRP | S_IROTH | S_IXOTH);
- }
- else {
- r = mkdir(dname, S_IRWXU | S_IRGRP | S_IXGRP | S_IROTH | S_IXOTH);
- }
-
- if (r == -1 && errno != EEXIST) {
- lua_pushboolean(L, false);
- lua_pushstring(L, strerror(errno));
-
- return 2;
- }
-
- lua_pushboolean(L, true);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- return 1;
- }
-
-
- static int
- lua_util_umask(lua_State *L)
- {
- LUA_TRACE_POINT;
- mode_t mask = 0, old;
-
- if (lua_type(L, 1) == LUA_TSTRING) {
- const char *str = lua_tostring(L, 1);
-
- if (str[0] == '0') {
- /* e.g. '022' */
- mask = strtol(str, NULL, 8);
- }
- else {
- /* XXX: implement modestring parsing at some point */
- return luaL_error(L, "invalid arguments");
- }
- }
- else if (lua_type(L, 1) == LUA_TNUMBER) {
- mask = lua_tointeger(L, 1);
- }
- else {
- return luaL_error(L, "invalid arguments");
- }
-
- old = umask(mask);
-
- lua_pushinteger(L, old);
-
- return 1;
- }
-
- static int
- lua_util_isatty(lua_State *L)
- {
- LUA_TRACE_POINT;
- if (isatty(STDOUT_FILENO)) {
- lua_pushboolean(L, true);
- }
- else {
- lua_pushboolean(L, false);
- }
-
- return 1;
- }
-
- /* Backport from Lua 5.3 */
-
- /******************************************************************************
- * Copyright (C) 1994-2016 Lua.org, PUC-Rio.
- *
- * Permission is hereby granted, free of charge, to any person obtaining
- * a copy of this software and associated documentation files (the
- * "Software"), to deal in the Software without restriction, including
- * without limitation the rights to use, copy, modify, merge, publish,
- * distribute, sublicense, and/or sell copies of the Software, and to
- * permit persons to whom the Software is furnished to do so, subject to
- * the following conditions:
- *
- * The above copyright notice and this permission notice shall be
- * included in all copies or substantial portions of the Software.
- *
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
- * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
- * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.
- * IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY
- * CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
- * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
- * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
- ******************************************************************************/
-
- /*
- ** {======================================================
- ** PACK/UNPACK
- ** =======================================================
- */
-
-
/* byte written for padding and alignment gaps */
#ifndef LUA_PACKPADBYTE
#define LUA_PACKPADBYTE 0x00
#endif

/* largest accepted size, in bytes, of a packed integer */
#define MAXINTSIZE 16

/* bits per char */
#define NB CHAR_BIT

/* all-ones mask covering exactly one char (NB bits) */
#define MC ((1 << NB) - 1)

/* sizeof(lua_Integer), as an int */
#define SZINT ((int) sizeof(lua_Integer))

/* largest value representable in a size_t */
#define MAX_SIZET ((size_t) (~(size_t) 0))

/* MAX_SIZET if size_t is narrower than int, INT_MAX otherwise */
#define MAXSIZE \
	(sizeof(size_t) < sizeof(int) ? MAX_SIZET : (size_t) (INT_MAX))
-
/*
 * Probe for the native byte order: the int member is set to 1, so the
 * overlapping char member reads as 1 exactly when the least significant
 * byte is stored first.
 */
static const union {
	int dummy;
	char little; /* true if machine is little endian */
} nativeendian = {.dummy = 1};
-
-
- /* dummy structure to get native alignment requirements */
- struct cD {
- char c;
- union {
- double d;
- void *p;
- lua_Integer i;
- lua_Number n;
- } u;
- };
-
- #define MAXALIGN (offsetof(struct cD, u))
-
- /*
- ** Union for serializing floats
- */
- typedef union Ftypes {
- float f;
- double d;
- lua_Number n;
- char buff[5 * sizeof(lua_Number)]; /* enough for any float type */
- } Ftypes;
-
-
- /*
- ** information to pack/unpack stuff
- */
- typedef struct Header {
- lua_State *L;
- int islittle;
- int maxalign;
- } Header;
-
- /*
- ** options for pack/unpack
- */
- typedef enum KOption {
- Kint, /* signed integers */
- Kuint, /* unsigned integers */
- Kfloat, /* floating-point numbers */
- Kchar, /* fixed-length strings */
- Kstring, /* strings with prefixed length */
- Kzstr, /* zero-terminated strings */
- Kpadding, /* padding */
- Kpaddalign, /* padding for alignment */
- Knop /* no-op (configuration or spaces) */
- } KOption;
-
- #if LUA_VERSION_NUM <= 502
- #define lua_Unsigned size_t
- #endif
-
- #if LUA_VERSION_NUM < 502
-
- #define lua_Unsigned size_t
-
- typedef struct luaL_Buffer_53 {
- luaL_Buffer b; /* make incorrect code crash! */
- char *ptr;
- size_t nelems;
- size_t capacity;
- lua_State *L2;
- } luaL_Buffer_53;
-
- #define luaL_Buffer luaL_Buffer_53
- #define COMPAT53_PREFIX lua
- #undef COMPAT53_API
-
- #if defined(__GNUC__) || defined(__clang__)
- #define COMPAT53_API __attribute__((__unused__)) static
- #else
- #define COMPAT53_API static
- #endif
-
- #define COMPAT53_CONCAT_HELPER(a, b) a##b
- #define COMPAT53_CONCAT(a, b) COMPAT53_CONCAT_HELPER(a, b)
-
- #define luaL_buffinit COMPAT53_CONCAT(COMPAT53_PREFIX, _buffinit_53)
- COMPAT53_API void luaL_buffinit(lua_State *L, luaL_Buffer_53 *B);
- #define luaL_prepbuffsize COMPAT53_CONCAT(COMPAT53_PREFIX, _prepbufsize_53)
- COMPAT53_API char *luaL_prepbuffsize(luaL_Buffer_53 *B, size_t s);
- #define luaL_addlstring COMPAT53_CONCAT(COMPAT53_PREFIX, _addlstring_53)
- COMPAT53_API void luaL_addlstring(luaL_Buffer_53 *B, const char *s, size_t l);
- #define luaL_addvalue COMPAT53_CONCAT(COMPAT53_PREFIX, _addvalue_53)
- COMPAT53_API void luaL_addvalue(luaL_Buffer_53 *B);
- #define luaL_pushresult COMPAT53_CONCAT(COMPAT53_PREFIX, _pushresult_53)
- COMPAT53_API void luaL_pushresult(luaL_Buffer_53 *B);
- #undef luaL_buffinitsize
- #define luaL_buffinitsize(L, B, s) \
- (luaL_buffinit(L, B), luaL_prepbuffsize(B, s))
-
- #undef luaL_prepbuffer
- #define luaL_prepbuffer(B) \
- luaL_prepbuffsize(B, LUAL_BUFFERSIZE)
-
- #undef luaL_addchar
- #define luaL_addchar(B, c) \
- ((void) ((B)->nelems < (B)->capacity || luaL_prepbuffsize(B, 1)), \
- ((B)->ptr[(B)->nelems++] = (c)))
-
- #undef luaL_addsize
- #define luaL_addsize(B, s) \
- ((B)->nelems += (s))
-
- #undef luaL_addstring
- #define luaL_addstring(B, s) \
- luaL_addlstring(B, s, strlen(s))
-
- #undef luaL_pushresultsize
- #define luaL_pushresultsize(B, s) \
- (luaL_addsize(B, s), luaL_pushresult(B))
-
- COMPAT53_API void
- luaL_buffinit(lua_State *L, luaL_Buffer_53 *B)
- {
- /* make it crash if used via pointer to a 5.1-style luaL_Buffer */
- B->b.p = NULL;
- B->b.L = NULL;
- B->b.lvl = 0;
- /* reuse the buffer from the 5.1-style luaL_Buffer though! */
- B->ptr = B->b.buffer;
- B->nelems = 0;
- B->capacity = LUAL_BUFFERSIZE;
- B->L2 = L;
- }
-
-
- COMPAT53_API char *
- luaL_prepbuffsize(luaL_Buffer_53 *B, size_t s)
- {
- if (B->capacity - B->nelems < s) { /* needs to grow */
- char *newptr = NULL;
- size_t newcap = B->capacity * 2;
- if (newcap - B->nelems < s)
- newcap = B->nelems + s;
- if (newcap < B->capacity) /* overflow */
- luaL_error(B->L2, "buffer too large");
- newptr = (char *) lua_newuserdata(B->L2, newcap);
- memcpy(newptr, B->ptr, B->nelems);
- if (B->ptr != B->b.buffer) {
- lua_replace(B->L2, -2); /* remove old buffer */
- }
- B->ptr = newptr;
- B->capacity = newcap;
- }
- return B->ptr + B->nelems;
- }
-
-
- COMPAT53_API void
- luaL_addlstring(luaL_Buffer_53 *B, const char *s, size_t l)
- {
- memcpy(luaL_prepbuffsize(B, l), s, l);
- luaL_addsize(B, l);
- }
-
-
- COMPAT53_API void
- luaL_addvalue(luaL_Buffer_53 *B)
- {
- size_t len = 0;
- const char *s = lua_tolstring(B->L2, -1, &len);
- if (!s)
- luaL_error(B->L2, "cannot convert value to string");
- if (B->ptr != B->b.buffer) {
- lua_insert(B->L2, -2); /* userdata buffer must be at stack top */
- }
- luaL_addlstring(B, s, len);
- lua_remove(B->L2, B->ptr != B->b.buffer ? -2 : -1);
- }
-
-
- COMPAT53_API void
- luaL_pushresult(luaL_Buffer_53 *B)
- {
- lua_pushlstring(B->L2, B->ptr, B->nelems);
- if (B->ptr != B->b.buffer) {
- lua_replace(B->L2, -2); /* remove userdata buffer */
- }
- }
-
- #endif
-
/*
** Returns 1 when 'c' is one of the characters '0'..'9', 0 otherwise.
*/
static int
digit(int c)
{
	return c >= '0' && c <= '9';
}
-
- static int
- getnum(const char **fmt, int df)
- {
- if (!digit(**fmt)) /* no number? */
- return df; /* return default value */
- else {
- int a = 0;
- do {
- a = a * 10 + (*((*fmt)++) - '0');
- } while (digit(**fmt) && a <= ((int) MAXSIZE - 9) / 10);
- return a;
- }
- }
-
-
- /*
- ** Read an integer numeral and raises an error if it is larger
- ** than the maximum size for integers.
- */
- static int
- getnumlimit(Header *h, const char **fmt, int df)
- {
- int sz = getnum(fmt, df);
- if (sz > MAXINTSIZE || sz <= 0)
- luaL_error(h->L, "integral size (%d) out of limits [1,%d]",
- sz, MAXINTSIZE);
- return sz;
- }
-
-
- /*
- ** Initialize Header
- */
- static void
- initheader(lua_State *L, Header *h)
- {
- h->L = L;
- h->islittle = nativeendian.little;
- h->maxalign = 1;
- }
-
-
- /*
- ** Read and classify next option. 'size' is filled with option's size.
- */
- static KOption
- getoption(Header *h, const char **fmt, int *size)
- {
- int opt = *((*fmt)++);
- *size = 0; /* default */
- switch (opt) {
- case 'b':
- *size = sizeof(char);
- return Kint;
- case 'B':
- *size = sizeof(char);
- return Kuint;
- case 'h':
- *size = sizeof(short);
- return Kint;
- case 'H':
- *size = sizeof(short);
- return Kuint;
- case 'l':
- *size = sizeof(long);
- return Kint;
- case 'L':
- *size = sizeof(long);
- return Kuint;
- case 'j':
- *size = sizeof(lua_Integer);
- return Kint;
- case 'J':
- *size = sizeof(lua_Integer);
- return Kuint;
- case 'T':
- *size = sizeof(size_t);
- return Kuint;
- case 'f':
- *size = sizeof(float);
- return Kfloat;
- case 'd':
- *size = sizeof(double);
- return Kfloat;
- case 'n':
- *size = sizeof(lua_Number);
- return Kfloat;
- case 'i':
- *size = getnumlimit(h, fmt, sizeof(int));
- return Kint;
- case 'I':
- *size = getnumlimit(h, fmt, sizeof(int));
- return Kuint;
- case 's':
- *size = getnumlimit(h, fmt, sizeof(size_t));
- return Kstring;
- case 'c':
- *size = getnum(fmt, -1);
- if (*size == -1)
- luaL_error(h->L, "missing size for format option 'c'");
- return Kchar;
- case 'z':
- return Kzstr;
- case 'x':
- *size = 1;
- return Kpadding;
- case 'X':
- return Kpaddalign;
- case ' ':
- break;
- case '<':
- h->islittle = 1;
- break;
- case '>':
- h->islittle = 0;
- break;
- case '=':
- h->islittle = nativeendian.little;
- break;
- case '!':
- h->maxalign = getnumlimit(h, fmt, MAXALIGN);
- break;
- default:
- luaL_error(h->L, "invalid format option '%c'", opt);
- }
- return Knop;
- }
-
-
- /*
- ** Read, classify, and fill other details about the next option.
- ** 'psize' is filled with option's size, 'notoalign' with its
- ** alignment requirements.
- ** Local variable 'size' gets the size to be aligned. (Kpadal option
- ** always gets its full alignment, other options are limited by
- ** the maximum alignment ('maxalign'). Kchar option needs no alignment
- ** despite its size.
- */
- static KOption
- getdetails(Header *h, size_t totalsize,
- const char **fmt, int *psize, int *ntoalign)
- {
- KOption opt = getoption(h, fmt, psize);
- int align = *psize; /* usually, alignment follows size */
- if (opt == Kpaddalign) { /* 'X' gets alignment from following option */
- if (**fmt == '\0' || getoption(h, fmt, &align) == Kchar || align == 0)
- luaL_argerror(h->L, 1, "invalid next option for option 'X'");
- }
- if (align <= 1 || opt == Kchar) /* need no alignment? */
- *ntoalign = 0;
- else {
- if (align > h->maxalign) /* enforce maximum alignment */
- align = h->maxalign;
- if ((align & (align - 1)) != 0) /* is 'align' not a power of 2? */
- luaL_argerror(h->L, 1, "format asks for alignment not power of 2");
- *ntoalign = (align - (int) (totalsize & (align - 1))) & (align - 1);
- }
- return opt;
- }
-
-
- /*
- ** Pack integer 'n' with 'size' bytes and 'islittle' endianness.
- ** The final 'if' handles the case when 'size' is larger than
- ** the size of a Lua integer, correcting the extra sign-extension
- ** bytes if necessary (by default they would be zeros).
- */
- static void
- packint(luaL_Buffer *b, lua_Unsigned n,
- int islittle, int size, int neg)
- {
- char *buff = luaL_prepbuffsize(b, size);
- int i;
- buff[islittle ? 0 : size - 1] = (char) (n & MC); /* first byte */
- for (i = 1; i < size; i++) {
- n >>= NB;
- buff[islittle ? i : size - 1 - i] = (char) (n & MC);
- }
- if (neg && size > SZINT) { /* negative number need sign extension? */
- for (i = SZINT; i < size; i++) /* correct extra bytes */
- buff[islittle ? i : size - 1 - i] = (char) MC;
- }
- luaL_addsize(b, size); /* add result to buffer */
- }
-
-
- /*
- ** Copy 'size' bytes from 'src' to 'dest', correcting endianness if
- ** given 'islittle' is different from native endianness.
- */
- static void
- copywithendian(volatile char *dest, volatile const char *src,
- int size, int islittle)
- {
- if (islittle == nativeendian.little) {
- while (size-- != 0)
- *(dest++) = *(src++);
- }
- else {
- dest += size - 1;
- while (size-- != 0)
- *(dest--) = *(src++);
- }
- }
-
-
- static int
- lua_util_pack(lua_State *L)
- {
- luaL_Buffer b;
- Header h;
- const char *fmt = luaL_checkstring(L, 1); /* format string */
- int arg = 1; /* current argument to pack */
- size_t totalsize = 0; /* accumulate total size of result */
- initheader(L, &h);
- lua_pushnil(L); /* mark to separate arguments from string buffer */
- luaL_buffinit(L, &b);
-
- while (*fmt != '\0') {
- int size, ntoalign;
- KOption opt = getdetails(&h, totalsize, &fmt, &size, &ntoalign);
- totalsize += ntoalign + size;
- while (ntoalign-- > 0)
- luaL_addchar(&b, LUA_PACKPADBYTE); /* fill alignment */
- arg++;
- switch (opt) {
- case Kint: { /* signed integers */
- lua_Integer n = luaL_checkinteger(L, arg);
- if (size < SZINT) { /* need overflow check? */
- lua_Integer lim = (lua_Integer) 1 << ((size * NB) - 1);
- luaL_argcheck(L, -lim <= n && n < lim, arg, "integer overflow");
- }
- packint(&b, (lua_Unsigned) n, h.islittle, size, (n < 0));
- break;
- }
- case Kuint: { /* unsigned integers */
- lua_Integer n = luaL_checkinteger(L, arg);
- if (size < SZINT) /* need overflow check? */
- luaL_argcheck(L,
- (lua_Unsigned) n < ((lua_Unsigned) 1 << (size * NB)),
- arg,
- "unsigned overflow");
- packint(&b, (lua_Unsigned) n, h.islittle, size, 0);
- break;
- }
- case Kfloat: { /* floating-point options */
- volatile Ftypes u;
- char *buff = luaL_prepbuffsize(&b, size);
- lua_Number n = luaL_checknumber(L, arg); /* get argument */
- if (size == sizeof(u.f))
- u.f = (float) n; /* copy it into 'u' */
- else if (size == sizeof(u.d))
- u.d = (double) n;
- else
- u.n = n;
- /* move 'u' to final result, correcting endianness if needed */
- copywithendian(buff, u.buff, size, h.islittle);
- luaL_addsize(&b, size);
- break;
- }
- case Kchar: { /* fixed-size string */
- size_t len;
- const char *s = luaL_checklstring(L, arg, &len);
- if ((size_t) size <=
- len) /* string larger than (or equal to) needed? */
- luaL_addlstring(&b,
- s,
- size); /* truncate string to asked size */
- else { /* string smaller than needed */
- luaL_addlstring(&b, s, len); /* add it all */
- while (len++ < (size_t) size) /* pad extra space */
- luaL_addchar(&b, LUA_PACKPADBYTE);
- }
- break;
- }
- case Kstring: { /* strings with length count */
- size_t len;
- const char *s = luaL_checklstring(L, arg, &len);
- luaL_argcheck(L, size >= (int) sizeof(size_t) || len < ((size_t) 1 << (size * NB)),
- arg, "string length does not fit in given size");
- packint(&b,
- (lua_Unsigned) len,
- h.islittle,
- size,
- 0); /* pack length */
- luaL_addlstring(&b, s, len);
- totalsize += len;
- break;
- }
- case Kzstr: { /* zero-terminated string */
- size_t len;
- const char *s = luaL_checklstring(L, arg, &len);
- luaL_argcheck(L, strlen(s) == len, arg, "string contains zeros");
- luaL_addlstring(&b, s, len);
- luaL_addchar(&b, '\0'); /* add zero at the end */
- totalsize += len + 1;
- break;
- }
- case Kpadding:
- luaL_addchar(&b, LUA_PACKPADBYTE); /* FALLTHROUGH */
- case Kpaddalign:
- case Knop:
- arg--; /* undo increment */
- break;
- }
- }
- luaL_pushresult(&b);
- return 1;
- }
-
-
- static int
- lua_util_packsize(lua_State *L)
- {
- Header h;
- const char *fmt = luaL_checkstring(L, 1); /* format string */
- size_t totalsize = 0; /* accumulate total size of result */
- initheader(L, &h);
- while (*fmt != '\0') {
- int size, ntoalign;
- KOption opt = getdetails(&h, totalsize, &fmt, &size, &ntoalign);
- size += ntoalign; /* total space used by option */
- luaL_argcheck(L, totalsize <= MAXSIZE - size, 1,
- "format result too large");
- totalsize += size;
- switch (opt) {
- case Kstring: /* strings with length count */
- case Kzstr: /* zero-terminated string */
- luaL_argerror(L, 1, "variable-length format");
- /* call never return, but to avoid warnings: */ /* FALLTHROUGH */
- default:
- break;
- }
- }
- lua_pushinteger(L, (lua_Integer) totalsize);
- return 1;
- }
-
-
- /*
- ** Unpack an integer with 'size' bytes and 'islittle' endianness.
- ** If size is smaller than the size of a Lua integer and integer
- ** is signed, must do sign extension (propagating the sign to the
- ** higher bits); if size is larger than the size of a Lua integer,
- ** it must check the unread bytes to see whether they do not cause an
- ** overflow.
- */
- static lua_Integer
- unpackint(lua_State *L, const char *str,
- int islittle, int size, int issigned)
- {
- lua_Unsigned res = 0;
- int i;
- int limit = (size <= SZINT) ? size : SZINT;
- for (i = limit - 1; i >= 0; i--) {
- res <<= NB;
- res |= (lua_Unsigned) (unsigned char) str[islittle ? i : size - 1 - i];
- }
- if (size < SZINT) { /* real size smaller than lua_Integer? */
- if (issigned) { /* needs sign extension? */
- lua_Unsigned mask = (lua_Unsigned) 1 << (size * NB - 1);
- res = ((res ^ mask) - mask); /* do sign extension */
- }
- }
- else if (size > SZINT) { /* must check unread bytes */
- int mask = (!issigned || (lua_Integer) res >= 0) ? 0 : MC;
- for (i = limit; i < size; i++) {
- if ((unsigned char) str[islittle ? i : size - 1 - i] != mask)
- luaL_error(L,
- "%d-byte integer does not fit into Lua Integer",
- size);
- }
- }
- return (lua_Integer) res;
- }
-
- static lua_Integer
- posrelat(lua_Integer pos, size_t len)
- {
- if (pos >= 0)
- return pos;
- else if (0u - (size_t) pos > len)
- return 0;
- else
- return (lua_Integer) len + pos + 1;
- }
-
- static int
- lua_util_unpack(lua_State *L)
- {
- Header h;
- const char *fmt = luaL_checkstring(L, 1);
- size_t ld;
- const char *data;
- int n = 0; /* number of results */
-
- if (lua_type(L, 2) == LUA_TUSERDATA) {
- struct rspamd_lua_text *t = lua_check_text(L, 2);
-
- if (!t) {
- return luaL_error(L, "invalid arguments");
- }
-
- data = t->start;
- ld = t->len;
- }
- else {
- data = luaL_checklstring(L, 2, &ld);
- }
-
- size_t pos = (size_t) posrelat(luaL_optinteger(L, 3, 1), ld) - 1;
- luaL_argcheck(L, pos <= ld, 3, "initial position out of string");
-
- initheader(L, &h);
-
- while (*fmt != '\0') {
- int size, ntoalign;
- KOption opt = getdetails(&h, pos, &fmt, &size, &ntoalign);
- if ((size_t) ntoalign + size > ~pos || pos + ntoalign + size > ld)
- luaL_argerror(L, 2, "data string too short");
- pos += ntoalign; /* skip alignment */
- /* stack space for item + next position */
- luaL_checkstack(L, 2, "too many results");
- n++;
- switch (opt) {
- case Kint:
- case Kuint: {
- lua_Integer res = unpackint(L, data + pos, h.islittle, size,
- (opt == Kint));
- lua_pushinteger(L, res);
- break;
- }
- case Kfloat: {
- volatile Ftypes u;
- lua_Number num;
- copywithendian(u.buff, data + pos, size, h.islittle);
- if (size == sizeof(u.f))
- num = (lua_Number) u.f;
- else if (size == sizeof(u.d))
- num = (lua_Number) u.d;
- else
- num = u.n;
- lua_pushnumber(L, num);
- break;
- }
- case Kchar: {
- lua_pushlstring(L, data + pos, size);
- break;
- }
- case Kstring: {
- size_t len = (size_t) unpackint(L,
- data + pos,
- h.islittle,
- size,
- 0);
- luaL_argcheck(L,
- pos + len + size <= ld,
- 2,
- "data string too short");
- lua_pushlstring(L, data + pos + size, len);
- pos += len; /* skip string */
- break;
- }
- case Kzstr: {
- size_t len = (int) strlen(data + pos);
- lua_pushlstring(L, data + pos, len);
- pos += len + 1; /* skip string plus final '\0' */
- break;
- }
- case Kpaddalign:
- case Kpadding:
- case Knop:
- n--; /* undo increment */
- break;
- }
- pos += size;
- }
- lua_pushinteger(L, pos + 1); /* next position */
- return n + 1;
- }
-
- static int
- lua_util_btc_polymod(lua_State *L)
- {
- uint64_t c = 1;
-
- if (lua_type(L, 1) != LUA_TTABLE) {
- return luaL_error(L, "invalid arguments");
- }
-
- for (lua_pushnil(L); lua_next(L, 1); lua_pop(L, 1)) {
- uint8_t c0 = c >> 35;
- uint64_t d = lua_tointeger(L, -1);
-
- c = ((c & 0x07ffffffff) << 5) ^ d;
-
- if (c0 & 0x01) c ^= 0x98f2bc8e61;
- if (c0 & 0x02) c ^= 0x79b76d99e2;
- if (c0 & 0x04) c ^= 0xf33e5fb3c4;
- if (c0 & 0x08) c ^= 0xae2eabe2a8;
- if (c0 & 0x10) c ^= 0x1e4f43e470;
- }
-
- if ((c ^ 1) == 0) {
- lua_pushboolean(L, true);
- }
- else {
- lua_pushboolean(L, false);
- }
-
- return 1;
- }
-
- static int
- lua_util_parse_smtp_date(lua_State *L)
- {
- return lua_parsers_parse_smtp_date(L);
- }
-
-
- static int
- lua_load_util(lua_State *L)
- {
- lua_newtable(L);
- luaL_register(L, NULL, utillib_f);
-
- return 1;
- }
-
- static int
- lua_load_int64(lua_State *L)
- {
- lua_newtable(L);
- luaL_register(L, NULL, int64lib_f);
-
- return 1;
- }
-
-
- void luaopen_util(lua_State *L)
- {
- rspamd_lua_new_class(L, rspamd_ev_base_classname, ev_baselib_m);
- lua_pop(L, 1);
- rspamd_lua_new_class(L, rspamd_int64_classname, int64lib_m);
- lua_pop(L, 1);
- rspamd_lua_add_preload(L, "rspamd_util", lua_load_util);
- rspamd_lua_add_preload(L, "rspamd_int64", lua_load_int64);
- }
-
- static int
- lua_int64_tostring(lua_State *L)
- {
- int64_t n = lua_check_int64(L, 1);
- char buf[32];
- bool is_signed = false;
-
- if (lua_isboolean(L, 2)) {
- is_signed = lua_toboolean(L, 2);
- }
-
- if (is_signed) {
- rspamd_snprintf(buf, sizeof(buf), "%L", n);
- }
- else {
- rspamd_snprintf(buf, sizeof(buf), "%uL", n);
- }
- lua_pushstring(L, buf);
-
- return 1;
- }
-
- static int
- lua_int64_fromstring(lua_State *L)
- {
- struct rspamd_lua_text *t = lua_check_text_or_string(L, 1);
-
- if (t && t->len > 0) {
- uint64_t u64;
- const char *p = t->start;
- gsize len = t->len;
- bool neg = false;
-
- /*
- * We use complicated negation to allow both signed and unsinged values to
- * fit into result.
- * So we read int64 as unsigned and copy it to signed number.
- * If we wanted u64 this allows to have the same memory representation of
- * signed and unsigned.
- * If we wanted signed i64 we still can use -1000500 and it will be parsed
- * properly
- */
- if (*p == '-') {
- neg = true;
- p++;
- len--;
- }
- if (!rspamd_strtou64(p, len, &u64)) {
- lua_pushnil(L);
- lua_pushstring(L, "invalid number");
- return 2;
- }
-
- int64_t *i64_p = lua_newuserdata(L, sizeof(int64_t));
- rspamd_lua_setclass(L, rspamd_int64_classname, -1);
- memcpy(i64_p, &u64, sizeof(u64));
-
- if (neg) {
- *i64_p = -(*i64_p);
- }
- }
- else {
- }
-
- return 1;
- }
-
- static int
- lua_int64_tonumber(lua_State *L)
- {
- int64_t n = lua_check_int64(L, 1);
- double d;
-
- d = n;
- lua_pushinteger(L, d);
-
- return 1;
- }
-
- static int
- lua_int64_hex(lua_State *L)
- {
- int64_t n = lua_check_int64(L, 1);
- char buf[32];
-
- rspamd_snprintf(buf, sizeof(buf), "%XL", n);
- lua_pushstring(L, buf);
-
- return 1;
- }
-
- static int
- lua_ev_base_loop(lua_State *L)
- {
- int flags = 0;
- struct ev_loop *ev_base;
-
- ev_base = lua_check_ev_base(L, 1);
- if (lua_isnumber(L, 2)) {
- flags = lua_tointeger(L, 2);
- }
-
- int ret = ev_run(ev_base, flags);
- lua_pushinteger(L, ret);
-
- return 1;
- }
|