From a3ea7982466941d746a09bafc8bf386711c48686 Mon Sep 17 00:00:00 2001 From: Martin Nordholts Date: Sat, 11 Dec 2021 14:00:45 +0100 Subject: [PATCH] Credit syntax definition and theme authors with new `--acknowledgements` option (#1971) The text that is printed is generated when building assets, by analyzing LICENSE and NOTICE files that comes with syntaxes and themes. We take this opportunity to also add a NOTICE file as defined by Apache License 2.0. --- CHANGELOG.md | 3 +- Cargo.lock | 2 + Cargo.toml | 4 +- NOTICE | 6 + assets/acknowledgements.bin | Bin 0 -> 9653 bytes assets/create.sh | 2 +- src/assets.rs | 10 + src/assets/build_assets.rs | 24 ++- src/assets/build_assets/acknowledgements.rs | 219 ++++++++++++++++++++ src/bin/bat/clap_app.rs | 12 ++ src/bin/bat/main.rs | 13 +- tests/integration_tests.rs | 37 ++++ 12 files changed, 325 insertions(+), 7 deletions(-) create mode 100644 NOTICE create mode 100644 assets/acknowledgements.bin create mode 100644 src/assets/build_assets/acknowledgements.rs diff --git a/CHANGELOG.md b/CHANGELOG.md index eecdd130..49e835d6 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -6,6 +6,7 @@ - Support for `--ignored-suffix` argument. See #1892 (@bojan88) - `$BAT_CONFIG_DIR` is now a recognized environment variable. It has precedence over `$XDG_CONFIG_HOME`, see #1727 (@billrisher) - Support for `x:+delta` syntax in line ranges (e.g. `20:+10`). See #1810 (@bojan88) +- Add new `--acknowledgements` option that gives credit to theme and syntax definition authors. See #1971 (@Enselic) ## Bugfixes @@ -47,7 +48,7 @@ ## `bat` as a library - Deprecate `HighlightingAssets::syntaxes()` and `HighlightingAssets::syntax_for_file_name()`. Use `HighlightingAssets::get_syntaxes()` and `HighlightingAssets::get_syntax_for_path()` instead. They return a `Result` which is needed for upcoming lazy-loading work to improve startup performance. They also return which `SyntaxSet` the returned `SyntaxReference` belongs to. See #1747, #1755, #1776, #1862 (@Enselic) -- Remove `HighlightingAssets::from_files` and `HighlightingAssets::save_to_cache`. Instead of calling the former and then the latter you now make a single call to `bat::assets::build`. See #1802 (@Enselic) +- Remove `HighlightingAssets::from_files` and `HighlightingAssets::save_to_cache`. Instead of calling the former and then the latter you now make a single call to `bat::assets::build`. See #1802, #1971 (@Enselic) - Replace the `error::Error(error::ErrorKind, _)` struct and enum with an `error::Error` enum. `Error(ErrorKind::UnknownSyntax, _)` becomes `Error::UnknownSyntax`, etc. Also remove the `error::ResultExt` trait. These changes stem from replacing `error-chain` with `thiserror`. See #1820 (@Enselic) - Add new `MappingTarget` enum variant `MapExtensionToUnknown`. Refer to its docummentation for more information. Clients are adviced to treat `MapExtensionToUnknown` the same as `MapToUnknown` in exhaustive matches. See #1703 (@cbolgiano) diff --git a/Cargo.lock b/Cargo.lock index 67eb0ecf..33d7fcfe 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -96,6 +96,7 @@ dependencies = [ "once_cell", "path_abs", "predicates", + "regex", "semver", "serde", "serde_yaml", @@ -106,6 +107,7 @@ dependencies = [ "thiserror", "unicode-width", "wait-timeout", + "walkdir", "wild", ] diff --git a/Cargo.toml b/Cargo.toml index 47f24849..22ea9ef1 100644 --- a/Cargo.toml +++ b/Cargo.toml @@ -34,7 +34,7 @@ minimal-application = [ git = ["git2"] # Support indicating git modifications paging = ["shell-words", "grep-cli"] # Support applying a pager on the output # Add "syntect/plist-load" when https://github.com/trishume/syntect/pull/345 reaches us -build-assets = ["syntect/yaml-load", "syntect/dump-create"] +build-assets = ["syntect/yaml-load", "syntect/dump-create", "regex", "walkdir"] # You need to use one of these if you depend on bat as a library: regex-onig = ["syntect/regex-onig"] # Use the "oniguruma" regex engine @@ -63,6 +63,8 @@ clircle = "0.3" bugreport = { version = "0.4", optional = true } dirs-next = { version = "2.0.0", optional = true } grep-cli = { version = "0.1.6", optional = true } +regex = { version = "1.0", optional = true } +walkdir = { version = "2.0", optional = true } [dependencies.git2] version = "0.13" diff --git a/NOTICE b/NOTICE new file mode 100644 index 00000000..97ff2fc8 --- /dev/null +++ b/NOTICE @@ -0,0 +1,6 @@ +Copyright (c) 2018-2021 bat-developers (https://github.com/sharkdp/bat). + +bat is made available under the terms of either the MIT License or the Apache +License 2.0, at your option. + +See the LICENSE-APACHE and LICENSE-MIT files for license details. diff --git a/assets/acknowledgements.bin b/assets/acknowledgements.bin new file mode 100644 index 0000000000000000000000000000000000000000..b3d31ea7145da0def788fcb7b70c50f6c0964e7d GIT binary patch literal 9653 zcmcJUWlUU+yX|L?K?iqtmnjaVxE6P(xI=Nb!HT z+;2BISy^kZ=ljmiFKc_Qof-JJtV<W!St(ISKo-@x zGBmJ1Q9yha zJj^jwB(tD3X%5Mi8}{{C@H{}a@=C!emr3uaYyzM zm*)eRIwOLyk>vP*j^j&$`Ao>o7vXR_+{50ciCiI{m*4Y7zL*nRH+du1rEMuv{yFcb z7^4LzIF5+u5lzzyQ__n?v&SQtOBhi>CEOtAi6Z7}xS={M86HncLeVcy1k(}}Ln5{a zxf6#o@~QGS6%;94M-=0UP6Q%8CW+Bep&?G&>UXI3PSrkL{-zg!0vRI|&VA`eM*dh@ zBI`vXl1vSP;Ng`p<~~mnTx^oyM}B1d{Bz(Zde8`oRpW>eh)+?AB~g}d@HK_2%KTkq zpWS(+Y`8*PBuUrArCdQ})Qu-{@{}14|BM)eb=}$QEGOSBEf&`@&DdpDg;#yqG|fb| zb;8h0aghfdQhc=clWeTZ6NvmPol3I)_QH^?Ad-{R>T)b+$k!khXGUwb$nIU5FZtgn zw_sQ*G!}({;?fBOvI>wR-e}UNF?ssI^9B+;Ayle5dDWB8ewjV`;zm;4uO^Y@?(uNPjU!GHJrMEX>(&16Xm+aFlKzM5_8$DqoiA6RIQhsXJaq%O zRWvYoL_C?`D-N)xBKCtE67k0}dG>v{HS!VFl6c|-aZ$8{M~<0qT+^|Ad@@>PEUX-9 zaD{U)smgS+Z~_#! z3{FHMmk0=w6=KNw34MJ)6s{kvW!tKyf4C1dAM&8S1frna`SS;wbHl%&%UX+7;S1;< zX1KOmG~lF3;Gy^LZ18t31OWXvg`a=7QOSbH!S{TB z$@36dWKZoxw!WBMPRBkQTYB=`4vhPEE4bcw_Ud7HzY>?O|BleMM3g!^sFfuZ#};9H zC4Tbt1pz|2PH)3DjU3%0!(9R6K4|LDcRbsRJggSo(#lA1C+JqZD`>H}WPe2JmS+4> zjlm*wnT1DQ?Cm*ehBf<(c{h0>Q?V!a9Y}smPb>+T!tPI4hz7bcvrxZp&&|R8OX&S` ze@Q3lBfiY34_=xScHGkO9wjNdo{?UkUg+;EO`l%cu{NxHMP^Cp zJanf*7j=2EbgIl7zQ>wZC2jT1*?b1P8`l@|ri*9yOU?+zx$Ww;1Q9mp5Sp#HZvqHs z28wQnty?E9BDn*Apt0nkk=nk0RS#r7M%JcWJ4h0*IE}9?NumI?J2DL4@I@r9BB#@+ zve8*-^-m8(MllJ01=4ACz+;M{g^rX;0iWkLdwJ19M0=?lsZ4SFJO`G-35<+m_c^5R zLswW<(nJMQQ%YrcXB{_>K{ztjAsoN#3h;q&A9~SgZQQA2>l2C^N_C$&#lyr2%6GE| z0eV*Gulga3@)(yK+I@UOIH1@d=Hy}{(1>h3*zZ#@rS7CdM3iDECl7R@%&6oZc5jsB zSz}nCd$)ZmGulmXvUY1lbm;PwLyLEcb-qJIGTrS^jWl;E)j2v>IbB7NnZk(0B9Nc4 z*AJe3kI#{5WRj=Ug*vGzn5%pB)aN#umwq!_==xyK&Kr8s&d-0EmE<||c6mGsS-Chb z@zP(#PmX@KcELhl&Cbr^DMcq<+9L0WKmHr>-QTR2H3(rt6DVpV1y=haLfqT|S zqEBbbZ{c6p#SeP5k&>LqggV-m#%7NO#0%^BgHe5_kj{#zb7rT^@Fo504E`bPA#C>< zduY<&^J4P!LdFjZni@$Z3zY=;_aFk#xmD7hyy`B_K&VvC20-5Wy?l-|AbJG`f(APQ z3moFp$tDFv@0&T10U>(XEK~i!l7qJc1wzgf+98RN`tmwt;%u4B?+t=Nx#W9jkbfc^ zPhCm=!ud47_Vyt9G!T2WpTq$9I=4vW9>Z?Z@<8Pt#cm?~K;`e_>jkXzLbtUdQ>5qt zQT9WOlEM|Jcp_G4bfuHitT}RodKj>F0jokt^mZt9tOLy$>td%P*EXJWxPSXA9Nit| zQg;p^W1fj)%vUgbS7I+odkinu!;F!?r<8wi1Pz-poO6g?CVy37`^{3EC{@c56UGc4d zF5wdRy4HI)s>mqN?&Qe-kKez!J7MmD$P>RIPEH+@{EwC}dBFP3(x{hK2igvdMscC# zv{3g|F*=E3>1^-4qpHKh0RewCrac=hdTXPf6qm~}^* zF1S=fYegBn!jxPxzZ#Ppb~ue>5#1+EQJhr}a-aDp8#trD_(&?UoMyT>;$kJN5V@-V zR4kz$oPE0caV`d`Q5LU1nD?hQ9&+{J)3NKs<%he{_0@Zj_0Jhbd)RQ{JJ>4=fHO#B zTVULoIcn)8)sTISEeGwne-rx zis?p!7}%73;|IfM2^^8d_h=Sa_;JxmCW6bbuty;3UlG&9szsjocc6UQ$@)*yP*eKRMZL};pc@S<=1(S5RL z(~$MJx}tgHcb41JWCnkz!Ah!y1zxK&2NWZbRQylS+84RbK@Q4|$uagzr4L&~k6*(Y zsG1rxZI1lb=6Juv+Ti#hjH^h{keiXS(j4i&i(W%Sbd=2APJ$XU{Gpo*Q0z4>9TA`W zeus3zvs4mME=`H7UT_QMo+NY>Yb!5VJ%Z=#R6kOPjNxJJeE~~!>8{NSDa}QJm0N?@ ztp}J`N%*R;fHP9JTpxkTMf3A*bw=hH3Aknhfx99Ns>(ZknW<)5lS?5On%5-1QzNcc zx2@c;|3ZLXq%5hJ#}36vRon{)&PaHUp5Q(>eLrNMYE3Napc&YJ-c#&-y z?f?xkIK50)Q*#~M0{_5F2MIA?O(>^hkc8fnFLoSQQNeZxU0{*uk?Sr#>uycu#(P^-~Yu*t%GrZgGr|Y46#-BF@%T5MY|xU#8E9R;4{GU%$iFw6sb8Z zQc(S|Jg?GIi7;>{zx>2a2es6{G_G@#X$3MpmahZoF^;)sywdb zuQ8|j(O{ge&9+x228G3jdSixL$E7@A-%Tyqi!b@8?*A>TjWAyrG9N?9cP>Sxh=anp$Gk&AP+Ew zK5w%;z28U*>j6n!N>&CfxcP5+2qZ}uzegC;{k>w~rcJw4=rWctyo9v6t@3epirk2m zrgrIItdc#q1$LnH|}oc8gM#3WvK7c~|l0hWzZwr|05d%NJGimmL952krkkP{AM zO@}*hw2pm~?G!n4rWKNC#9$H2=i65E_w;ruD7P6+BBj8f^X{ILU#Cy*Thax*6pquv zLI$QuszhtdYq*LsOp>07+Wk0RMW1$lS~m%nNtK$%P3}jusCNU4jCkUdHS&=u3lU*v z=QQ5a^Dn@}7EP+RG~7dft%~8GDH-K&;KrlX`C!sCz^kefMgHxF)9bB2B>WWF|>|FLWaww zoJ)9sq-*bMZf)V(1ei8Kj*awXP|LN2>a{vC4Q5W(1~Qa6^?btO$VL9yGWj8b#Y7X- zn2$rZsg{jQP4Dxiz!*y{@XsK$Y1*bDGJot7_Sc|8_U}$VPf977jkWn3It+SDNUWU{+fx^va;-2BQ==ZVC&nF zDA?T79fPa0GK|Q|%|e=Wh_)nEJZX8PC)#V!OKaEiQ|oCv}Geg$p? z3TPOOV|UA8od|s%IThDT6z*;4>ffvU?T+gyjG~I{lv9_+ZN}1bftAJ( zO5*wIsrr~o^8~dDLajH)Q@b1L&lMv>Qx3iAQ#1xlMds{YRu|2)z^pU+@^;z%o+IznG`V$< zUKy7`5{@cG4~%*gJh&uDJbUk(eip&AixH&Igc24a_Ql0Kl+xcmaaH%TDp@k4fxsi= zMU$weEPvrkp}E{3#J20vc^x1O@K>DOtmB`v8ALTuJ7P=RVmh&`#kkKN$rbxOWCr6< zYht{xL^Mobq;mgNXUa{U8itr26mMJsNoYZi`x;Lck9Yc1is+*D!-P44sUm1W(|L&* z-e~g5oE4s@;LsSI(7>6}riz=@BMS8C`+ajrv^u9|B}0Y-VT@kHWODT2BDf^{EQeV# zVy(ZL^|K*&V2qW9Jw98LgT~Ou8O&c(f8O(MqppAk!#Dcwm@Upg0P0o^0F0c zqJW=;9vCi*IlR@#$ixd#2i>I(NFAuT8Y_ED5uB+sC=dsGbQ7;_=y$N4<6&^+k`SZ( zF?X|0%*_%+M=b0_1%aPs<8huy%Ojbq*2x6$E@?&bRYW*KB<13AX+pBUtA0P@L^-Jq zBjW0^?<4S}o1C+nIi;PKyFES?UIcROZJz+LIzt@x-R3N8bdc;n-XKw2D(DHYGTJ?j z!t~GoiKjjyHBHYmjGQ|XQ926?SdvN7;q4^0TZO?X?h1NvaVtU36+n2#KB{L5-C8QJ zmx60fbzsJqANSV;yO9q^Dh9h@FZvU0q%{qGSTS5y$fAs^IJbyaQ}gd^6xd)r>@(O` z*D9Jj)aIeU3+MlZ+MXMA7>0hvNpXJgXlj+`o+;5%=T#zc*36_!U~C2)>JCv9j}%Zg zlhO%wbBCtLC7DMe6qsaQ;>J4bAA`|Y*mD3=Rl-t8(FoYBFuoW z`_1DNsSONpXSOWpKRDLTmh`_DA07rjb=Ba&-yTbEhvNtk{Xl)jH2=}(nz4%%@@p$~ zE-WOs=?pf9!(y}`USNp~sJmtaZJAjW^7UOOK`KK-nCV>_8wJG$i$F~(#E{B*7{0QB z_FM}=`Ll>St10Fzh=YzvnABj>}?1!%*C;-71rg zqY@xIV&LAoNoPA0x|SedBRZHA8GVcU90+GcmEI3-^P&X?Sce}F{DvzE5;gqwUB`YQ zRXKZF#jPgl)Vua_$uVnIZ1{#o#ZdX$bt&j<&jr5Io(V|_aAFmr&XG)4r|zH}YH>4_MGp#U3&%rTNEHIBIWQ zu+~i>Hmj4Fr1-}iy)Tj@5f$B16jesaLvoplxRT`KetGWa19Qs3FiwIf^-N;DefePV%0y-d=k8vH673f)&$#VIj1 zVy+$*lJlw=-Sw@rs>I`U44`}O6OpS_Q^#AMn_C>RI-O zc1wIybd&G2yr1fdlk+2_wbYs`U*6-YcUdZ!d-~#=r`WUa2QxDZ8$MS@GK=fAm(|E4 zFNl9+>1H#MyvVe8EpEejwD*Kw{^>Ulg#M5<97MF0m7hwDN-S?@n>ajHdN_utX=Mmj zbq*i@&F-51C%QozpA!XuD*ZxPWSI0*z>FHeZayh%7QoV5Q z(dr$t^}ZVVG-=t)z2C9oMpKU5f959R=N>FSF17b5s`TOo$X)NLhJU6+OzkHMq;^O z>Bl@;kHg6!B}(+C6~X>it-7VbgF6`9 zpfcwa^rvrl;ZT{n0gcgwK3vaa&%tr8L;iud7kH{OPfC!;Cj0LJcewN(H{b6dqN_OP zlz#UzCn4m8ACxt{-?10MNkwB^zI1@z2 zZ2n{Ofem5)&abN8rIlOe^EhIMH$D@7@ox*c%s64mR#BSkb+iA0COof3_9wl72XOAF zqK2Y!vzN(|P)y-mN{Xk-M#kFgN*0_H?ZyZR+@X?fX<)?nvqrMhEh{%1Gx0Hf?AG1^ z3b)Un7j*=6h)0VAU1nBzV2(x$0tun~NxtJ0Bz}MPbAusyZMiNLK*drj7;RJJ!juRd zGQ>*KLMaFUZY2^ld=b9LBPoNRr0xd5;ff(fdkMs9Lc&OW(9_;_0HUP1Pfad2=Yha` z{XOq4v)za38Go@y%>+u72~|jb=Jd{ni}*<5)4{sn6ud#59F_z@_Q50z#!ZM_R+; z3c+?n_Cd%9$}B1shHx0szslq;yVC1=^&qEd3ChyNv4S;wL2ZkQmgG$zl^Z>TTNO09 z37;%vZJoQb#(P!XB*o=yQl{a2xL7TnFvN!C%eWWDSxEIa1x-s$v zvcjWu1x3^twe8}{^VTwUcoY_Na`yy&w%Xjyi8D>>xN-XB3|76?P}e?b{G*rMmmA6u z_F(ZjEQ{dgDPAyim=cfgy=)+QH|h4_g(%msc7pb&hoyJsoNnj_u*r)#(jG@=oU@<| z@tWQ&lg6PfWC~GdIX{tk*y+BMs{5KIDrBh0yn zF``S)$qjo4!v|D{5iFvW59IB^%}JTn%4X z{V<{mj&_+z{mjXg5Y02}wiCDpB=Am@4}{NIpBi+rZKx9Gd(zL&CvVhI8$E10meFc^ zoLinvA}Ww;I?z^EoET~)*-N#%hO6Jc6WhexoXbdde}NFlGF3Nz)2c+u;@rae;R3y)-_HMblm_H3 zlz!5@ywJKri6M@IE*DmIJB#7aOME!t_}Q{u@HgJp;E5v00DoGvOJXw&Kt|8uNCo>( z^b7RhT)#YAuTt*IdZhuatD;$bC2>qqK4CV+vId}7wircufUh2dtI`a+Qs>J(6ZE0w z11o)Rx^5pzJ=@}liZV|YJenHkPxtcTKqk~%p);{F&axuaJ&;XJL#rM#QLP}zciOL6 zf7u`n>B1Ne4BjqU*lgd4hHG>MZEBzv$Y-hn#TcW}?$ zP$89Pke=G+1`s4oG!kjsgEj6BzgML1P1imMSlV0gJtH^MLVr(Y$al#-B;#uaWaACP zwKxpIcKHjD{#*I7D1wxMV7-LBh#Rx{9xuAgV;HY=Zw9F6*kQMQ3uNXQN?%r zqvs-TU3q^r*ccw)p{3_~uWLk1e1))CaFwuCaFw=Aa22ydaFw;|%{_wU7zeUolP4PF zvg)~KYUxjryb=HT?lnPmT#P3}x$(iw{S`$9^ZMt$sfrz_bQg#Dp0E%n;A@)xIi5BI z-@~IPs4g-Gh@$DW4z5)nG|H9+M6JNEpuvvALI-IQ1l|MiRDe-8h(?%MJv)LV+96<; zDO0GV9YU%sQFIgoAI;Dw!K2!0wl;>fZ;TUnI*wuhTlUJ%+WP_#i&VU{!o5G$#`~7q zb!KD$(`uMm6leDxj&#VI7$CAHV`}W^GyBVrUxLSkYPB1H4nK@2yCzeA!p^gAyO>gT zn>rf*D@w;%ibA!Q|!d(e&t72j6Io#Df4i6b1w?69YtyCdu@iBx{H`ycEH5jr=ZI&4p(?4ulM^E<>j*g7q%3ex^D76oVh}kQSE2 zkQT=>Dh3UYD>HkRr23vu{rqbrFs|maJ*d4nfNpb~*m7>KX_fRH9%5d7Yu|a^SAgbj zjOfy!w0TU5?xOPm3?Q(|=~ilbVPYZa9nA^BKFxfP5sAA>Tk5Mm5^>aCvgwnHy+ zn!sWWe@oCmS^vYDY-f1{Tm^zeV^W!uQ}f6|Mb z3xMMP&qD$UNWHni(Vuwe-d}V=l||@YV-RVF4@A+oYha~hN=K4e)@cQ zb4A#LHCH)L>>b>@%D6KFWVzs1h96o9(OPdzel!tDgtf8mVZ+)1G@A8JI%3NJ literal 0 HcmV?d00001 diff --git a/assets/create.sh b/assets/create.sh index 65533934..103fdb76 100755 --- a/assets/create.sh +++ b/assets/create.sh @@ -53,7 +53,7 @@ bat cache --clear done ) -bat cache --build --blank --source="$ASSET_DIR" --target="$ASSET_DIR" +bat cache --build --blank --acknowledgements --source="$ASSET_DIR" --target="$ASSET_DIR" ( cd "$ASSET_DIR" diff --git a/src/assets.rs b/src/assets.rs index ec80c1ea..9ef66b95 100644 --- a/src/assets.rs +++ b/src/assets.rs @@ -55,6 +55,9 @@ pub(crate) const COMPRESS_THEMES: bool = false; /// performance due to lazy-loading pub(crate) const COMPRESS_LAZY_THEMES: bool = true; +/// Compress for size of ~10 kB instead of ~120 kB +pub(crate) const COMPRESS_ACKNOWLEDGEMENTS: bool = true; + impl HighlightingAssets { fn new(serialized_syntax_set: SerializedSyntaxSet, theme_set: LazyThemeSet) -> Self { HighlightingAssets { @@ -305,6 +308,13 @@ pub(crate) fn get_integrated_themeset() -> LazyThemeSet { from_binary(include_bytes!("../assets/themes.bin"), COMPRESS_THEMES) } +pub fn get_acknowledgements() -> String { + from_binary( + include_bytes!("../assets/acknowledgements.bin"), + COMPRESS_ACKNOWLEDGEMENTS, + ) +} + pub(crate) fn from_binary(v: &[u8], compressed: bool) -> T { asset_from_contents(v, "n/a", compressed) .expect("data integrated in binary is never faulty, but make sure `compressed` is in sync!") diff --git a/src/assets/build_assets.rs b/src/assets/build_assets.rs index fe78f2b1..f3448679 100644 --- a/src/assets/build_assets.rs +++ b/src/assets/build_assets.rs @@ -5,10 +5,14 @@ use syntect::highlighting::ThemeSet; use syntect::parsing::{SyntaxSet, SyntaxSetBuilder}; use crate::assets::*; +use acknowledgements::build_acknowledgements; + +mod acknowledgements; pub fn build( source_dir: &Path, include_integrated_assets: bool, + include_acknowledgements: bool, target_dir: &Path, current_version: &str, ) -> Result<()> { @@ -18,9 +22,17 @@ pub fn build( let syntax_set = syntax_set_builder.build(); + let acknowledgements = build_acknowledgements(source_dir, include_acknowledgements)?; + print_unlinked_contexts(&syntax_set); - write_assets(&theme_set, &syntax_set, target_dir, current_version) + write_assets( + &theme_set, + &syntax_set, + &acknowledgements, + target_dir, + current_version, + ) } fn build_theme_set(source_dir: &Path, include_integrated_assets: bool) -> Result { @@ -89,6 +101,7 @@ fn print_unlinked_contexts(syntax_set: &SyntaxSet) { fn write_assets( theme_set: &LazyThemeSet, syntax_set: &SyntaxSet, + acknowledgements: &Option, target_dir: &Path, current_version: &str, ) -> Result<()> { @@ -106,6 +119,15 @@ fn write_assets( COMPRESS_SYNTAXES, )?; + if let Some(acknowledgements) = acknowledgements { + asset_to_cache( + acknowledgements, + &target_dir.join("acknowledgements.bin"), + "acknowledgements", + COMPRESS_ACKNOWLEDGEMENTS, + )?; + } + print!( "Writing metadata to folder {} ... ", target_dir.to_string_lossy() diff --git a/src/assets/build_assets/acknowledgements.rs b/src/assets/build_assets/acknowledgements.rs new file mode 100644 index 00000000..742e3791 --- /dev/null +++ b/src/assets/build_assets/acknowledgements.rs @@ -0,0 +1,219 @@ +use std::fs::read_to_string; +use std::path::{Path, PathBuf}; + +use walkdir::DirEntry; + +use crate::error::*; + +struct PathAndStem { + path: PathBuf, + stem: String, + relative_path: String, +} + +/// Looks for LICENSE and NOTICE files in `source_dir`, does some rudimentary +/// analysis, and compiles them together in a single string that is meant to be +/// used in the output to `--acknowledgements` +pub fn build_acknowledgements( + source_dir: &Path, + include_acknowledgements: bool, +) -> Result> { + if !include_acknowledgements { + return Ok(None); + } + + let mut acknowledgements = format!("{}\n\n", include_str!("../../../NOTICE")); + + // Sort entries so the order is stable over time + let entries = walkdir::WalkDir::new(source_dir).sort_by(|a, b| a.path().cmp(b.path())); + for path_and_stem in entries + .into_iter() + .flatten() + .flat_map(|entry| to_path_and_stem(source_dir, entry)) + { + if let Some(license_text) = handle_file(&path_and_stem)? { + append_to_acknowledgements( + &mut acknowledgements, + &path_and_stem.relative_path, + &license_text, + ) + } + } + + Ok(Some(acknowledgements)) +} + +fn to_path_and_stem(source_dir: &Path, entry: DirEntry) -> Option { + let path = entry.path(); + + Some(PathAndStem { + path: path.to_owned(), + stem: path.file_stem().map(|s| s.to_string_lossy().to_string())?, + relative_path: path + .strip_prefix(source_dir) + .map(|p| p.to_string_lossy().to_string()) + .ok()?, + }) +} + +fn handle_file(path_and_stem: &PathAndStem) -> Result> { + if path_and_stem.stem == "NOTICE" { + handle_notice(&path_and_stem.path) + } else if path_and_stem.stem.to_ascii_uppercase() == "LICENSE" { + handle_license(&path_and_stem.path) + } else { + Ok(None) + } +} + +fn handle_notice(path: &Path) -> Result> { + // Assume NOTICE as defined by Apache License 2.0. These must be part of acknowledgements. + Ok(Some(read_to_string(path)?)) +} + +fn handle_license(path: &Path) -> Result> { + let license_text = read_to_string(path)?; + + if include_license_in_acknowledgments(&license_text) { + Ok(Some(license_text)) + } else if license_not_needed_in_acknowledgements(&license_text) { + Ok(None) + } else { + Err(format!("ERROR: License is of unknown type: {:?}", path).into()) + } +} + +fn include_license_in_acknowledgments(license_text: &str) -> bool { + let markers = vec![ + // MIT + "The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.", + + // BSD + "Redistributions in binary form must reproduce the above copyright notice,", + + // Apache 2.0 + "Apache License Version 2.0, January 2004 http://www.apache.org/licenses/", + "Licensed under the Apache License, Version 2.0 (the \"License\");", + ]; + + license_contains_marker(license_text, &markers) +} + +fn license_not_needed_in_acknowledgements(license_text: &str) -> bool { + let markers = vec![ + // Public domain + "This is free and unencumbered software released into the public domain.", + + // Special license of assets/syntaxes/01_Packages/LICENSE + "Permission to copy, use, modify, sell and distribute this software is granted. This software is provided \"as is\" without express or implied warranty, and with no claim as to its suitability for any purpose." + ]; + + license_contains_marker(license_text, &markers) +} + +fn license_contains_marker(license_text: &str, markers: &[&str]) -> bool { + let normalized_license_text = normalize_license_text(license_text); + markers.iter().any(|m| normalized_license_text.contains(m)) +} + +fn append_to_acknowledgements( + acknowledgements: &mut String, + relative_path: &str, + license_text: &str, +) { + acknowledgements.push_str(&format!("## {}\n\n{}", relative_path, license_text)); + + // Make sure the last char is a newline to not mess up formatting later + if acknowledgements + .chars() + .last() + .expect("acknowledgements is not the empty string") + != '\n' + { + acknowledgements.push('\n'); + } + + // Add two more newlines to make it easy to distinguish where this text ends + // and the next starts + acknowledgements.push_str("\n\n"); +} + +/// Replaces newlines with a space character, and replaces multiple spaces with one space. +/// This makes the text easier to analyze. +fn normalize_license_text(license_text: &str) -> String { + use regex::Regex; + + let whitespace_and_newlines = Regex::new(r"\s").unwrap(); + let as_single_line = whitespace_and_newlines.replace_all(license_text, " "); + + let many_spaces = Regex::new(" +").unwrap(); + many_spaces.replace_all(&as_single_line, " ").to_string() +} + +#[cfg(test)] +mod tests { + #[cfg(test)] + use super::*; + + #[test] + fn test_normalize_license_text() { + let license_text = "This is a license text with these terms: + * Complicated multi-line + term with indentation"; + + assert_eq!( + "This is a license text with these terms: * Complicated multi-line term with indentation".to_owned(), + normalize_license_text(license_text), + ); + } + + #[test] + fn test_normalize_license_text_with_windows_line_endings() { + let license_text = "This license text includes windows line endings\r +and we need to handle that."; + + assert_eq!( + "This license text includes windows line endings and we need to handle that." + .to_owned(), + normalize_license_text(license_text), + ); + } + + #[test] + fn test_append_to_acknowledgements_adds_newline_if_missing() { + let mut acknowledgements = "preamble\n\n\n".to_owned(); + + append_to_acknowledgements(&mut acknowledgements, "some/path", "line without newline"); + assert_eq!( + "preamble + + +## some/path + +line without newline + + +", + acknowledgements + ); + + append_to_acknowledgements(&mut acknowledgements, "another/path", "line with newline\n"); + assert_eq!( + "preamble + + +## some/path + +line without newline + + +## another/path + +line with newline + + +", + acknowledgements + ); + } +} diff --git a/src/bin/bat/clap_app.rs b/src/bin/bat/clap_app.rs index 1a618bb2..94ddce55 100644 --- a/src/bin/bat/clap_app.rs +++ b/src/bin/bat/clap_app.rs @@ -508,6 +508,12 @@ pub fn build_app(interactive_output: bool) -> ClapApp<'static, 'static> { .hidden_short_help(true) .help("Show diagnostic information for bug reports.") ) + .arg( + Arg::with_name("acknowledgements") + .long("acknowledgements") + .hidden_short_help(true) + .help("Show acknowledgements."), + ) .arg( Arg::with_name("ignored-suffix") .number_of_values(1) @@ -578,6 +584,12 @@ pub fn build_app(interactive_output: bool) -> ClapApp<'static, 'static> { "Create completely new syntax and theme sets \ (instead of appending to the default sets).", ), + ) + .arg( + Arg::with_name("acknowledgements") + .long("acknowledgements") + .requires("build") + .help("Build acknowledgements.bin."), ), ) } diff --git a/src/bin/bat/main.rs b/src/bin/bat/main.rs index d4ce33d9..2d9f3164 100644 --- a/src/bin/bat/main.rs +++ b/src/bin/bat/main.rs @@ -47,9 +47,13 @@ fn build_assets(matches: &clap::ArgMatches) -> Result<()> { .map(Path::new) .unwrap_or_else(|| PROJECT_DIRS.cache_dir()); - let blank = matches.is_present("blank"); - - bat::assets::build(source_dir, !blank, target_dir, clap::crate_version!()) + bat::assets::build( + source_dir, + !matches.is_present("blank"), + matches.is_present("acknowledgements"), + target_dir, + clap::crate_version!(), + ) } fn run_cache_subcommand(matches: &clap::ArgMatches) -> Result<()> { @@ -324,6 +328,9 @@ fn run() -> Result { } else if app.matches.is_present("cache-dir") { writeln!(io::stdout(), "{}", cache_dir())?; Ok(true) + } else if app.matches.is_present("acknowledgements") { + writeln!(io::stdout(), "{}", bat::assets::get_acknowledgements())?; + Ok(true) } else { run_controller(inputs, &config) } diff --git a/tests/integration_tests.rs b/tests/integration_tests.rs index 986d9952..5648f252 100644 --- a/tests/integration_tests.rs +++ b/tests/integration_tests.rs @@ -1,4 +1,5 @@ use assert_cmd::cargo::CommandCargoExt; +use predicates::boolean::PredicateBooleanExt; use predicates::{prelude::predicate, str::PredicateStrExt}; use serial_test::serial; use std::path::Path; @@ -1275,3 +1276,39 @@ fn ignored_suffix_arg() { .stdout("\u{1b}[38;5;231m{\"test\": \"value\"}\u{1b}[0m") .stderr(""); } + +#[test] +fn acknowledgements() { + bat() + .arg("--acknowledgements") + .assert() + .success() + .stdout( + // Just some sanity checking that avoids names of persons, except our own Keith Hall :) + predicate::str::contains( + "Copyright (c) 2018-2021 bat-developers (https://github.com/sharkdp/bat).", + ) + .and(predicate::str::contains( + "Copyright (c) 2012-2020 The Sublime CMake authors", + )) + .and(predicate::str::contains( + "Copyright 2014-2015 SaltStack Team", + )) + .and(predicate::str::contains( + "Copyright (c) 2013-present Dracula Theme", + )) + .and(predicate::str::contains( + "## syntaxes/01_Packages/Rust/LICENSE.txt", + )) + .and(predicate::str::contains( + "## syntaxes/02_Extra/http-request-response/LICENSE", + )) + .and(predicate::str::contains( + "## themes/dracula-sublime/LICENSE", + )) + .and(predicate::str::contains("Copyright (c) 2017 b123400")) + .and(predicate::str::contains("Copyright (c) 2021 Keith Hall")) + .and(predicate::str::contains("Copyright 2014 Clams")), + ) + .stderr(""); +}