1 /** Lazy Substitution Algorithms.
2  *
3  * See_Also: http://forum.dlang.org/post/pymxzazxximtgixzbnpq@forum.dlang.org
4  */
5 module nxt.substitution;
6 
7 import std.range.primitives : isInputRange, ElementType;
8 import core.internal.traits : Unqual;
9 import std.typecons : Tuple;
10 import std.traits : isExpressionTuple;
11 import std.algorithm.searching : startsWith;
12 
13 import nxt.traits_ex : hasEvenLength, haveCommonType;
14 
15 import std.stdio;
16 
17 version(unittest)
18 {
19     import std.algorithm.comparison : equal;
20 }
21 
22 import std.traits : isExpressionTuple;
23 import nxt.traits_ex : haveCommonType;
24 
25 /** Similar to $(D among) but for set of replacements/substitutions $(D substs).
26  *
27  * Time-Complexity: O(1) thanks to D's $(D switch) guaranteeing O(1).
28  */
29 template substitute(substs...)
30 if ((substs.length & 1) == 0 && // need even number of elements (>= 1)
31     substs.length >= 2 && // and at least one replacement pair
32     isExpressionTuple!substs &&
33     haveCommonType!(substs))
34 {
35     Value substitute(Value)(Value value)
36     if (haveCommonType!(Value, substs)) // TODO: need static map incorrect
37     {
38         switch (value)
39         {
40             static foreach (i; 0 .. substs.length / 2)
41             {
42             case substs[2*i]:
43                 return substs[2*i + 1];
44             }
45         default:
46             return value;
47         }
48     }
49 }
50 
51 @safe pure nothrow unittest
52 {
53     auto xyz_abc__(T)(T value)
54     {
55         immutable a = "a";
56         const b = "b";
57         auto c = "c";
58         return value.substitute!("x", a,
59                                  "y", b,
60                                  "z", c);
61     }
62     assert(xyz_abc__("x") == "a");
63     assert(xyz_abc__("y") == "b");
64     assert(xyz_abc__("z") == "c");
65     assert(xyz_abc__("w") == "w");
66 }
67 
68 /** Substitute in parallel all elements in $(D r) which equal (according to $(D
69  * pred)) $(D ss[2*n]) with $(D ss[2*n + 1]) for $(D n) = 0, 1, 2, ....
70  */
71 auto substitute(alias pred = (a, b) => a == b, R, Ss...)(R r, Ss ss)
72 if (isInputRange!(Unqual!R) &&
73     Ss.length >= 2 &&
74     hasEvenLength!Ss &&
75     haveCommonType!(ElementType!R, Ss))
76 {
77     import std.algorithm.iteration : map;
78     import std.functional : binaryFun;
79     enum n = Ss.length / 2;
80     auto replaceElement(E)(E e)
81     {
82         static foreach (i; 0 .. n)
83         {
84             if (binaryFun!pred(e, ss[2*i]))
85             {
86                 return ss[2*i + 1];
87             }
88         }
89         return e;
90     }
91     return r.map!(a => replaceElement(a));
92 }
93 
94 ///
95 @safe pure unittest
96 {
97     import std.conv : to;
98     import std.algorithm : map;
99     auto x = `42`.substitute('2', '3')
100                  .substitute('3', '1');
101     static assert(is(ElementType!(typeof(x)) == dchar));
102     assert(equal(x, `41`));
103 }
104 
105 ///
106 @safe pure unittest
107 {
108     assert(`do_it`.substitute('_', ' ')
109                   .equal(`do it`));
110     int[3] x = [1, 2, 3];
111     auto y = x[].substitute(1, 0.1)
112                 .substitute(0.1, 0.2);
113     static assert(is(typeof(y.front) == double));
114     assert(y.equal([0.2, 2, 3]));
115     assert(`do_it`.substitute('_', ' ',
116                               'd', 'g',
117                               'i', 't',
118                               't', 'o')
119                   .equal(`go to`));
120     import std.range : retro;
121     assert(equal([1, 2, 3].substitute(1, 0.1)
122                           .retro,
123                  [3, 2, 0.1]));
124 }
125 
126 /** Substitute in parallel all elements in $(D r) which equal (according to $(D
127     pred)) $(D ss[2*n]) with $(D ss[2*n + 1]) for $(D n) = 0, 1, 2, ....
128 
129     Because $(D ss) are known at compile time, time-complexity for each element
130     substitution is O(1).
131 */
132 template substitute(ss...)
133 if (isExpressionTuple!ss &&
134     ss.length >= 2 &&
135     hasEvenLength!ss)
136 {
137     auto substitute(R)(R r)
138         if (isInputRange!(Unqual!R) &&
139             haveCommonType!(ElementType!R, ss))
140     {
141         import std.algorithm.iteration : map;
142         enum n = ss.length / 2;
143         auto replaceElement(E)(E e)
144         {
145             switch (e)
146             {
147                 static foreach (i; 0 .. n)
148                 {
149                 case ss[2*i]: return ss[2*i + 1];
150                 }
151             default: return e;
152             }
153         }
154         return r.map!(a => replaceElement(a));
155     }
156 }
157 
158 ///
159 @safe pure unittest
160 {
161     assert(`do_it`.substitute!('_', ' ')
162                   .equal(`do it`));
163     int[3] x = [1, 2, 3];
164     auto y = x[].substitute!(1, 0.1);
165     assert(y.equal([0.1, 2, 3]));
166     static assert(is(typeof(y.front) == double));
167     assert(`do_it`.substitute!('_', ' ',
168                                'd', 'g',
169                                'i', 't',
170                                't', 'o')
171                   .equal(`go to`));
172     import std.range : retro;
173     assert(equal([1, 2, 3].substitute!(1, 0.1)
174                           .retro,
175                  [3, 2, 0.1]));
176 }
177 
178 /** Helper range for subsequence overload of $(D substitute).
179  */
180 private auto substituteSplitter(alias pred = `a == b`, R, Rs...)(R haystack, Rs needles)
181 if (Rs.length >= 1 &&
182     is(typeof(startsWith!pred(haystack, needles))))
183 {
184     static struct Result
185     {
186         alias Hit = size_t; // 0 iff no hit, otherwise hit in needles[index-1]
187         alias E = Tuple!(R, Hit);
188         this(R haystack, Rs needles)
189         {
190             this._rest = haystack;
191             this._needles = needles;
192             popFront();
193         }
194 
195         @property auto ref front()
196         {
197             import std.range.primitives : empty;
198             return !_skip.empty ? E(_skip, 0) : E(_hit, _hitNr);
199         }
200 
201         import std.range.primitives : isInfinite;
202         static if (isInfinite!R)
203             enum empty = false; // propagate infiniteness
204         else
205             bool empty() const @property
206             {
207                 import std.range.primitives : empty;
208                 return _skip.empty && _hit.empty && _rest.empty;
209             }
210 
211         void popFront() @trusted
212         {
213             import std.range.primitives : empty;
214             if (!_skip.empty)
215             {
216                 _skip = R.init; // jump over _skip
217             }
218             else
219             {
220                 import std.algorithm.searching : find;
221 
222                 static if (_needles.length >= 2) // if variadic version
223                 {
224                     auto match = _rest.find!pred(_needles);
225                     auto hitValue = match[0];
226                     _hitNr = match[1];
227                 }
228                 else
229                 {
230                     auto match = _rest.find!pred(_needles);
231                     auto hitValue = match;
232                     _hitNr = !match.empty ? 1 : 0;
233                 }
234 
235                 if (_hitNr == 0) // no more hits
236                 {
237                     _skip = _rest;
238                     _hit = R.init;
239                     _rest = R.init;
240                 }
241                 else
242                 {
243                     import std.traits : isSomeString;
244                     static if (isSomeString!R)
245                     {
246                         size_t hitLength = size_t.max;
247                         final switch (_hitNr - 1)
248                         {
249                             foreach (const i, Ri; Rs)
250                             {
251                             case i: hitLength = _needles[i].length; break;
252                             }
253                         }
254                         assert(hitLength != size_t.max); // not needed if match returned bounded!int
255 
256                         if (_rest.ptr == hitValue.ptr) // match at start of _rest
257                         {
258                             _hit = hitValue[0 .. hitLength];
259                             _rest = hitValue[hitLength .. $];
260                         }
261                         else
262                         {
263                             _skip = _rest[0 .. hitValue.ptr - _rest.ptr];
264                             _hit = hitValue[0 .. hitLength];
265                             _rest = hitValue[hitLength .. $];
266                         }
267                     }
268                     else
269                     {
270                         static assert(0, `Handle R without slicing ` ~ R.stringof);
271                     }
272                 }
273             }
274         }
275     private:
276         R _rest;
277         Rs _needles;
278         R _skip; // skip before next hit
279         R _hit; // most recent (last) hit if any
280         size_t _hitNr; // hit number: 0 means no hit, otherwise index+1 to needles that matched
281     }
282     return Result(haystack, needles);
283 }
284 
285 @safe pure unittest
286 {
287     auto h = `alpha.beta.gamma`;
288     auto fs = h.substituteSplitter(`alpha`, `beta`, `gamma`);
289     alias FS = typeof(fs);
290     alias E = ElementType!FS;
291     static assert(is(E == Tuple!(string, ulong)));
292     assert(equal(fs, [E(`alpha`, 1),
293                       E(`.`, 0),
294                       E(`beta`, 2),
295                       E(`.`, 0),
296                       E(`gamma`, 3)]));
297 }
298 
299 @safe pure unittest
300 {
301     auto h = `.alpha.beta.gamma`;
302     auto fs = h.substituteSplitter(`alpha`, `beta`, `gamma`);
303     alias FS = typeof(fs);
304     alias E = ElementType!FS;
305     static assert(is(E == Tuple!(string, ulong)));
306     assert(equal(fs, [E(`.`, 0),
307                       E(`alpha`, 1),
308                       E(`.`, 0),
309                       E(`beta`, 2),
310                       E(`.`, 0),
311                       E(`gamma`, 3)]));
312 }
313 
314 @safe pure unittest
315 {
316     auto h = `alpha.beta.gamma.`;
317     auto fs = h.substituteSplitter(`alpha`, `beta`, `gamma`);
318     alias FS = typeof(fs);
319     alias E = ElementType!FS;
320     static assert(is(E == Tuple!(string, ulong)));
321     assert(equal(fs, [E(`alpha`, 1),
322                       E(`.`, 0),
323                       E(`beta`, 2),
324                       E(`.`, 0),
325                       E(`gamma`, 3),
326                       E(`.`, 0)]));
327 }
328 
329 @safe pure unittest
330 {
331     auto h = `alpha.alpha.alpha.`;
332     auto fs = h.substituteSplitter(`alpha`);
333     alias FS = typeof(fs);
334     alias E = ElementType!FS;
335     static assert(is(E == Tuple!(string, ulong)));
336     assert(equal(fs, [E(`alpha`, 1),
337                       E(`.`, 0),
338                       E(`alpha`, 1),
339                       E(`.`, 0),
340                       E(`alpha`, 1),
341                       E(`.`, 0)]));
342 }
343 
344 template Stride(size_t stride, size_t offset, Args...)
345 if (stride > 0)
346 {
347     import std.meta : AliasSeq;
348     static if (offset >= Args.length)
349     {
350         alias Stride = AliasSeq!();
351     }
352     else static if (stride >= Args.length)
353     {
354         alias Stride = AliasSeq!(Args[offset]);
355     }
356     else
357     {
358         alias Stride = AliasSeq!(Args[offset],
359                                  Stride!(stride, offset, Args[stride .. $]));
360     }
361 }
362 
363 /** Substitute in parallel all subsequences in $(D r) which equal (according to
364     $(D pred)) $(D ss[2*n]) with $(D ss[2*n + 1]) for $(D n) = 0, 1, 2, ....
365 */
366 auto substitute(alias pred = (a, b) => a == b, R, Ss...)(R r, Ss ss)
367 if (isInputRange!(Unqual!R) &&
368     Ss.length >= 2 &&
369     hasEvenLength!Ss &&
370     haveCommonType!(ElementType!R,
371                     ElementType!(Ss[0])))
372 {
373     import std.algorithm.iteration : map;
374     import std.functional : binaryFun;
375 
376     enum n = Ss.length / 2;
377 
378     auto replaceElement(E)(E e)
379     {
380         auto value = e[0];
381         const hitNr = e[1];
382         if (hitNr == 0) // not hit
383         {
384             return value;
385         }
386         else
387         {
388             static foreach (i; 0 .. n)
389             {
390                 if (hitNr == i + 1)
391                 {
392                     return ss[2*i + 1]; // replacement
393                 }
394             }
395             assert(false);
396         }
397     }
398 
399     // extract inputs
400     alias Ins = Stride!(2, 0, Ss);
401     Ins ins;
402     static foreach (i; 0 .. n)
403     {
404         ins[i] = ss[2*i];
405     }
406 
407     import std.algorithm.iteration : map, joiner;
408     return r.substituteSplitter!pred(ins)
409             .map!(a => replaceElement(a))
410             .joiner;
411 }
412 
413 @safe pure unittest
414 {
415     assert(`do_it now, sir`.substitute(`_`, ` `,
416                                        `d`, `g`,
417                                        `i`, `t`,
418                                        `t`, `o`,
419                                        `now`, `work`,
420                                        `sir`, `please`)
421                   .equal(`go to work, please`));
422 }
423 
424 @safe pure unittest
425 {
426     assert((`abcDe`.substitute(`a`, `AA`,
427                                `b`, `DD`)
428                    .substitute('A', 'y',
429                                'D', 'x',
430                                'e', '1'))
431            .equal(`yyxxcx1`));
432 }