001/*
002 * Licensed to the Apache Software Foundation (ASF) under one or more
003 * contributor license agreements.  See the NOTICE file distributed with
004 * this work for additional information regarding copyright ownership.
005 * The ASF licenses this file to You under the Apache License, Version 2.0
006 * (the "License"); you may not use this file except in compliance with
007 * the License.  You may obtain a copy of the License at
008 *
009 *      http://www.apache.org/licenses/LICENSE-2.0
010 *
011 * Unless required by applicable law or agreed to in writing, software
012 * distributed under the License is distributed on an "AS IS" BASIS,
013 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
014 * See the License for the specific language governing permissions and
015 * limitations under the License.
016 */
017
018package org.apache.commons.rng.core.source64;
019
020import java.util.stream.Stream;
021import org.apache.commons.rng.JumpableUniformRandomProvider;
022import org.apache.commons.rng.SplittableUniformRandomProvider;
023import org.apache.commons.rng.UniformRandomProvider;
024import org.apache.commons.rng.core.util.NumberFactory;
025import org.apache.commons.rng.core.util.RandomStreams;
026
027/**
028 * A 64-bit all purpose generator.
029 *
030 * <p>This is a member of the LXM family of generators: L=Linear congruential generator;
031 * X=Xor based generator; and M=Mix. This member uses a 128-bit LCG and 1024-bit Xor-based
032 * generator. It is named as {@code "L128X1024MixRandom"} in the {@code java.util.random}
033 * package introduced in JDK 17; the LXM family is described in further detail in:
034 *
035 * <blockquote>Steele and Vigna (2021) LXM: better splittable pseudorandom number generators
036 * (and almost as fast). Proceedings of the ACM on Programming Languages, Volume 5,
037 * Article 148, pp 1–31.</blockquote>
038 *
039 * <p>Memory footprint is 1312 bits and the period is 2<sup>128</sup> (2<sup>1024</sup> - 1).
040 *
041 * <p>This generator implements
042 * {@link org.apache.commons.rng.LongJumpableUniformRandomProvider LongJumpableUniformRandomProvider}.
043 * In addition instances created with a different additive parameter for the LCG are robust
044 * against accidental correlation in a multi-threaded setting. The additive parameters must be
045 * different in the most significant 127-bits.
046 *
047 * <p>This generator implements
048 * {@link org.apache.commons.rng.SplittableUniformRandomProvider SplittableUniformRandomProvider}.
049 * The stream of generators created using the {@code splits} methods support parallelisation
050 * and are robust against accidental correlation by using unique values for the additive parameter
051 * for each instance in the same stream. The primitive streaming methods support parallelisation
052 * but with no assurances of accidental correlation; each thread uses a new instance with a
053 * randomly initialised state.
054 *
055 * @see <a href="https://doi.org/10.1145/3485525">Steele &amp; Vigna (2021) Proc. ACM Programming
056 *      Languages 5, 1-31</a>
057 * @see <a href="https://docs.oracle.com/en/java/javase/17/docs/api/java.base/java/util/random/package-summary.html">
058 *      JDK 17 java.util.random javadoc</a>
059 * @since 1.5
060 */
061public class L128X1024Mix extends AbstractL128 implements SplittableUniformRandomProvider {
062    /** Size of the seed vector. */
063    private static final int SEED_SIZE = 20;
064    /** Size of the XBG state vector. */
065    private static final int XBG_STATE_SIZE = 16;
066    /** Size of the LCG state vector. */
067    private static final int LCG_STATE_SIZE = SEED_SIZE - XBG_STATE_SIZE;
068    /** Low half of 128-bit LCG multiplier. */
069    private static final long ML = LXMSupport.M128L;
070
071    /** State of the XBG. */
072    private final long[] x = new long[XBG_STATE_SIZE];
073    /** Index in "state" array. */
074    private int index;
075
076    /**
077     * Creates a new instance.
078     *
079     * @param seed Initial seed.
080     * If the length is larger than 20, only the first 20 elements will
081     * be used; if smaller, the remaining elements will be automatically
082     * set. A seed containing all zeros in the last 16 elements
083     * will create a non-functional XBG sub-generator and a low
084     * quality output with a period of 2<sup>128</sup>.
085     *
086     * <p>The 1st and 2nd elements are used to set the LCG increment; the least significant bit
087     * is set to odd to ensure a full period LCG. The 3rd and 4th elements are used
088     * to set the LCG state.</p>
089     */
090    public L128X1024Mix(long[] seed) {
091        super(seed = extendSeed(seed, SEED_SIZE));
092        System.arraycopy(seed, SEED_SIZE - XBG_STATE_SIZE, x, 0, XBG_STATE_SIZE);
093        // Initialising to 15 ensures that (index + 1) % 16 == 0 and the
094        // first state picked from the XBG generator is state[0].
095        index = XBG_STATE_SIZE - 1;
096    }
097
098    /**
099     * Creates a copy instance.
100     *
101     * @param source Source to copy.
102     */
103    protected L128X1024Mix(L128X1024Mix source) {
104        super(source);
105        System.arraycopy(source.x, 0, x, 0, XBG_STATE_SIZE);
106        index = source.index;
107    }
108
109    /** {@inheritDoc} */
110    @Override
111    protected byte[] getStateInternal() {
112        final long[] s = new long[XBG_STATE_SIZE + 1];
113        System.arraycopy(x, 0, s, 0, XBG_STATE_SIZE);
114        s[XBG_STATE_SIZE] = index;
115        return composeStateInternal(NumberFactory.makeByteArray(s),
116                                    super.getStateInternal());
117    }
118
119    /** {@inheritDoc} */
120    @Override
121    protected void setStateInternal(byte[] s) {
122        final byte[][] c = splitStateInternal(s, (XBG_STATE_SIZE + 1) * Long.BYTES);
123
124        final long[] tmp = NumberFactory.makeLongArray(c[0]);
125        System.arraycopy(tmp, 0, x, 0, XBG_STATE_SIZE);
126        index = (int) tmp[XBG_STATE_SIZE];
127
128        super.setStateInternal(c[1]);
129    }
130
131    /** {@inheritDoc} */
132    @Override
133    public long next() {
134        // LXM generate.
135        // Old state is used for the output allowing parallel pipelining
136        // on processors that support multiple concurrent instructions.
137
138        final int q = index;
139        index = (q + 1) & 15;
140        final long s0 = x[index];
141        long s15 = x[q];
142        final long sh = lsh;
143
144        // Mix
145        final long z = LXMSupport.lea64(sh + s0);
146
147        // LCG update
148        // The LCG is, in effect, "s = m * s + a" where m = ((1LL << 64) + ML)
149        final long sl = lsl;
150        final long al = lal;
151        final long u = ML * sl;
152        // High half
153        lsh = ML * sh + LXMSupport.unsignedMultiplyHigh(ML, sl) + sl + lah +
154              // Carry propagation
155              LXMSupport.unsignedAddHigh(u, al);
156        // Low half
157        lsl = u + al;
158
159        // XBG update
160        s15 ^= s0;
161        x[q] = Long.rotateLeft(s0, 25) ^ s15 ^ (s15 << 27);
162        x[index] = Long.rotateLeft(s15, 36);
163
164        return z;
165    }
166
167    /**
168     * {@inheritDoc}
169     *
170     * <p>The jump size is the equivalent of moving the state <em>backwards</em> by
171     * (2<sup>1024</sup> - 1) positions. It can provide up to 2<sup>128</sup>
172     * non-overlapping subsequences.
173     */
174    @Override
175    public UniformRandomProvider jump() {
176        return super.jump();
177    }
178
179    /**
180     * {@inheritDoc}
181     *
182     * <p>The jump size is the equivalent of moving the state <em>backwards</em> by
183     * 2<sup>64</sup> (2<sup>1024</sup> - 1) positions. It can provide up to
184     * 2<sup>64</sup> non-overlapping subsequences of length 2<sup>64</sup>
185     * (2<sup>1024</sup> - 1); each subsequence can provide up to 2<sup>64</sup>
186     * non-overlapping subsequences of length (2<sup>1024</sup> - 1) using the
187     * {@link #jump()} method.
188     */
189    @Override
190    public JumpableUniformRandomProvider longJump() {
191        return super.longJump();
192    }
193
194    /** {@inheritDoc} */
195    @Override
196    AbstractL128 copy() {
197        // This exists to ensure the jump function performed in the super class returns
198        // the correct class type. It should not be public.
199        return new L128X1024Mix(this);
200    }
201
202    /** {@inheritDoc} */
203    @Override
204    public SplittableUniformRandomProvider split(UniformRandomProvider source) {
205        return create(source.nextLong(), source);
206    }
207
208    /** {@inheritDoc} */
209    @Override
210    public Stream<SplittableUniformRandomProvider> splits(long streamSize, SplittableUniformRandomProvider source) {
211        return RandomStreams.generateWithSeed(streamSize, source, L128X1024Mix::create);
212    }
213
214    /**
215     * Create a new instance using the given {@code seed} and {@code source} of randomness
216     * to initialise the instance.
217     *
218     * @param seed Seed used to initialise the instance.
219     * @param source Source of randomness used to initialise the instance.
220     * @return A new instance.
221     */
222    private static SplittableUniformRandomProvider create(long seed, UniformRandomProvider source) {
223        final long[] s = new long[SEED_SIZE];
224        // LCG state. The addition lower-half uses the input seed.
225        // The LCG addition parameter is set to odd so left-shift the seed.
226        s[0] = source.nextLong();
227        s[1] = seed << 1;
228        s[2] = source.nextLong();
229        s[3] = source.nextLong();
230        // XBG state must not be all zero
231        long x = 0;
232        for (int i = LCG_STATE_SIZE; i < s.length; i++) {
233            s[i] = source.nextLong();
234            x |= s[i];
235        }
236        if (x == 0) {
237            // SplitMix style seed ensures at least one non-zero value
238            x = s[LCG_STATE_SIZE - 1];
239            for (int i = LCG_STATE_SIZE; i < s.length; i++) {
240                s[i] = LXMSupport.lea64(x);
241                x += LXMSupport.GOLDEN_RATIO_64;
242            }
243        }
244        return new L128X1024Mix(s);
245    }
246}