EntropyString
diff --git a/‎.swift-version
Lines changed: 1 addition & 0 deletions b/‎.swift-version
Lines changed: 1 addition & 0 deletions
diff --git a/‎Entropy.playground/Pages/Character Bases.xcplaygroundpage/Contents.swift
Lines changed: 39 additions & 0 deletions b/‎Entropy.playground/Pages/Character Bases.xcplaygroundpage/Contents.swift
Lines changed: 39 additions & 0 deletions
diff --git a/‎Entropy.playground/Pages/Custom Bytes.xcplaygroundpage/Contents.swift
Lines changed: 28 additions & 0 deletions b/‎Entropy.playground/Pages/Custom Bytes.xcplaygroundpage/Contents.swift
Lines changed: 28 additions & 0 deletions
diff --git a/‎Entropy.playground/Pages/Custom Characters.xcplaygroundpage/Contents.swift
Lines changed: 44 additions & 0 deletions b/‎Entropy.playground/Pages/Custom Characters.xcplaygroundpage/Contents.swift
Lines changed: 44 additions & 0 deletions
diff --git a/‎Entropy.playground/Pages/Efficiency.xcplaygroundpage/Contents.swift
Lines changed: 49 additions & 0 deletions b/‎Entropy.playground/Pages/Efficiency.xcplaygroundpage/Contents.swift
Lines changed: 49 additions & 0 deletions
diff --git a/‎Entropy.playground/Pages/More Examples.xcplaygroundpage/Contents.swift
Lines changed: 64 additions & 0 deletions b/‎Entropy.playground/Pages/More Examples.xcplaygroundpage/Contents.swift
Lines changed: 64 additions & 0 deletions
diff --git a/‎Entropy.playground/Pages/Overview.xcplaygroundpage/Contents.swift
Lines changed: 32 additions & 0 deletions b/‎Entropy.playground/Pages/Overview.xcplaygroundpage/Contents.swift
Lines changed: 32 additions & 0 deletions
diff --git a/‎Entropy.playground/Pages/Real Need.xcplaygroundpage/Contents.swift
Lines changed: 88 additions & 0 deletions b/‎Entropy.playground/Pages/Real Need.xcplaygroundpage/Contents.swift
Lines changed: 88 additions & 0 deletions
diff --git a/‎Entropy.playground/Pages/Secure Bytes.xcplaygroundpage/Contents.swift
Lines changed: 37 additions & 0 deletions b/‎Entropy.playground/Pages/Secure Bytes.xcplaygroundpage/Contents.swift
Lines changed: 37 additions & 0 deletions
@@ -0,0 +1 @@
+3.0
@@ -0,0 +1,39 @@
+//: [Previous](@previous)
+//: ## Character Bases
+//:
+//: As we've seen in the previous sections, `EntropyString` provides default characters for each of
+//: the supported bases. Let's see what's under the hood.
+import EntropyString
+
+print("Base 64: \(RandomString.characters(for: .base64))\n")
+//: The call to `RandomString.characters(for:)` returns the characters used for any of the
+//: bases defined by the `RandomString.CharBase` enum. The following code reveals all the
+//: character bases.
+print("Base 32: \(RandomString.characters(for: .base32))\n")
+print("Base 16: \(RandomString.characters(for: .base16))\n")
+print("Base  8: \(RandomString.characters(for: .base8))\n")
+print("Base  4: \(RandomString.characters(for: .base4))\n")
+print("Base  2: \(RandomString.characters(for: .base2))\n")
+//: The default character bases were chosen as follows:
+//:  - Base 64: **ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-_**
+//:     - The file system and URL safe char set from
+//:       [RFC 4648](https://tools.ietf.org/html/rfc4648#section-5).
+//:  - Base 32: **2346789bdfghjmnpqrtBDFGHJLMNPQRT**
+//:      * Remove all upper and lower case vowels (including y)
+//:      * Remove all numbers that look like letters
+//:      * Remove all letters that look like numbers
+//:      * Remove all letters that have poor distinction between upper and lower case values.
+//:      * The resulting strings don't look like English words and are easy to parse visually.
+//:  - Base 16: **0123456789abcdef**
+//:     - Hexadecimal
+//:  - Base  8: **01234567**
+//:     - Octal
+//:  - Base  4: **ATCG**
+//:     - DNA alphabet. No good reason; just wanted to get away from the obvious.
+//:  - Base  2: **01**
+//:     - Binary
+//:
+//: You may, of course, want to choose the characters used, which is covered next in [Custom
+//: Characters](Custom%20Characters).
+//:
+//: [TOC](Table%20of%20Contents) | [Next](@next)
@@ -0,0 +1,28 @@
+//: [Previous](@previous)
+//: ## Custom Bytes
+//:
+//: As described in [Secure Bytes](Secure%20Bytes), `EntropyString` automatically generates random
+//: bytes using either `SecRandomCopyBytes` or `arc4random_buf`. These functions are fine, but you
+//: may have a need to provide your own bytes, say for deterministic testing or to use a
+//: specialized byte generator. The `RandomString.entropy(of:using:bytes:)` function allows
+//: passing in your own bytes to create a string.
+import EntropyString
+
+let bytes: RandomString.Bytes = [250, 200, 150, 100]
+let string = try! RandomString.entropy(of: 30, using: .base32, bytes: bytes)
+print("String: \(string)\n")
+//: * callout(string): Th7fjL
+//:
+//: The __bytes__ provided can come from any source. However, the number of bytes must be
+//: sufficient to generate the string as described in the [Efficiency](Efficiency) section.
+//: `RandomString.entropy(of:using:bytes:)` throws `RandomString.RandomError.tooFewBytes` if
+//: the string cannot be formed from the passed bytes.
+do {
+  try RandomString.entropy(of: 32, using: .base32, bytes: bytes)  // expected to throw: the 4 bytes above are too few
+}
+catch {
+  print(error)  // `error` is the implicit binding for the thrown value
+}
+//: * callout(error): tooFewBytes
+//:
+//: [TOC](Table%20of%20Contents)
@@ -0,0 +1,44 @@
+//: [Previous](@previous)
+//: ## Custom Characters
+//:
+//: Being able to easily generate random strings is great, but what if you want to specify your
+//: own characters? For example, suppose you want to visualize flipping a coin to produce entropy
+//: of 10 bits.
+import EntropyString
+
+let randomString = RandomString()
+var flips = randomString.entropy(of: 10, using: .base2)
+print("flips: \(flips)\n")
+//: * callout(flips): 0101001110
+//:
+//: The resulting string of __0__'s and __1__'s doesn't look quite right. You want to use the
+//: characters __H__ and __T__ instead.
+try! randomString.use("HT", for: .base2)
+flips = randomString.entropy(of: 10, using: .base2)
+print("flips: \(flips)\n")
+//: * callout(flips): HTTTHHTTHH
+//:
+//: Note that setting custom characters in the above code requires using an *instance* of
+//: `RandomString`, whereas in the previous sections we used *class* functions for all calls. The
+//: function signatures are the same in each case, but you can't change the static character bases
+//: used in the class `RandomString` (i.e., there is no `RandomString.use(_:for:)` function).
+//:
+//: As another example, we saw in [Character Bases](Character%20Bases) the default characters for
+//: base 16 are **0123456789abcdef**. Suppose you like uppercase hexadecimal letters instead.
+try! randomString.use("0123456789ABCDEF", for: .base16)
+let hex = randomString.entropy(of: 48, using: .base16)
+print("hex: \(hex)\n")
+//: * callout(hex): 4D20D9AA862C
+//:
+//: Or suppose you want a random password with numbers, lowercase letters and special characters.
+try! randomString.use("1234567890abcdefghijklmnopqrstuvwxyz-=[];,./~!@#$%^&*()_+{}|:<>?", for: .base64)
+let password = randomString.entropy(of: 64, using: .base64)
+print("password: \(password)")
+//: * callout(password): }4?0x*$o_=w
+//:
+//: Note that `randomString.use(_:for:)` can throw an `Error`. The throw is actually a
+//: `RandomStringError` and will occur if the number of characters doesn't match the number
+//: required for the base or if the characters are not all unique. The section on [Unique
+//: Characters](Unique%20Characters) discusses these errors further.
+//:
+//: [TOC](Table%20of%20Contents) | [Next](@next)
@@ -0,0 +1,49 @@
+//: [Previous](@previous)
+//: ## Efficiency
+//:
+//: To efficiently create random strings, `EntropyString` generates the necessary number of
+//: bytes needed for each string and uses those bytes in a bit shifting scheme to index into
+//: a character base. For example, consider generating strings from the `.base32` character
+//: base. There are __32__ characters in the base, so an index into an array of those characters
+//: would be in the range `[0,31]`. Generating a random string of `.base32` characters is thus
+//: reduced to generating a random sequence of indices in the range `[0,31]`.
+//:
+//: To generate the indices, `EntropyString` slices just enough bits from the array of bytes to create
+//: each index. In the example at hand, 5 bits are needed to create an index in the range
+//: `[0,31]`. `EntropyString` processes the byte array 5 bits at a time to create the indices. The first
+//: index comes from the first 5 bits of the first byte, the second index comes from the last 3 bits of
+//: the first byte combined with the first 2 bits of the second byte, and so on as the byte array is
+//: systematically sliced to form indices into the character base. And since bit shifting and addition
+//: of byte values is really efficient, this scheme is quite fast.
+//:
+//: The `EntropyString` scheme is also efficient with regard to the amount of randomness used. Consider
+//: the following common solution to generating random strings. To generate a character, an index into
+//: the available characters is created using `arc4random_uniform`. The code looks something like:
+//:
+//:    for _ in 0..<len {
+//:      let offset = Int(arc4random_uniform(charCount))
+//:      let index = chars.index(chars.startIndex, offsetBy: offset)
+//:      let char = chars[index]
+//:      string += String(char)
+//:    }
+//:
+//: `arc4random_uniform` generates 32 bits of randomness, returned as a `UInt32`. The returned value is
+//: used to create an **index**. Suppose we're creating strings of **len** 16 using a **charCount**
+//: of 32. Each **char** consumes 32 bits of randomness (generated by `arc4random_uniform` per
+//: character) while only injecting 5 bits of entropy into **string**. But a string of length 16 using
+//: 32 possible characters has an entropy carrying capacity of 80 bits. So creating each **string**
+//: requires a total of 512 bits of randomness while only actually carrying 80 bits of that entropy
+//: forward in the string itself. That means 432 bits (84% of the total) of the generated randomness is
+//: simply thrown away.
+//:
+//: Compare that to the `EntropyString` scheme. For the example above, slicing off 5 bits at a time
+//: requires a total of 80 bits (10 bytes). Creating the same strings as above, `EntropyString` uses 80
+//: bits of randomness per string with no wasted bits. In general, the `EntropyString` scheme can waste
+//: up to 7 bits per string, but that's the worst case scenario and that's *per string*, not *per
+//: character*!
+//:
+//: Fortunately you don't need to really understand how the bytes are efficiently sliced and diced to get
+//: the string. But you may want to know that [Secure Bytes](Secure%20Bytes) are used, and that's the next
+//: topic.
+//:
+//: [TOC](Table%20of%20Contents) | [Next](@next)
@@ -0,0 +1,64 @@
+//: [Previous](@previous)
+//: ## More Examples
+//:
+//: In [Real Need](Real%20Need) our developer used hexadecimal characters for the strings.
+//: Let's look at using other characters instead.
+//:
+//: We'll start with using 32 characters. What 32 characters, you ask? Well, the [Character
+//: Bases](Character%20Bases) section discusses the default characters available in `EntropyString`
+//: and the [Custom Characters](Custom%20Characters) section describes how you can use whatever
+//: characters you want. For now we'll stick to the provided defaults.
+import EntropyString
+
+var bits = Entropy.bits(total: 10000, risk: .ten06)
+var string = RandomString.entropy(of: bits, using: .base32)
+print("String: \(string)\n")
+//: * callout(string): PmgMJrdp9h
+//: 
+//: We're using the same __bits__ calculation since we haven't changed the number of IDs or the
+//: accepted risk of probabilistic uniqueness. But this time we use 32 characters and our resulting
+//: ID only requires 10 characters (and can carry 50 bits of entropy, which, as when we used 16
+//: characters, is more than the required 45.51).
+//:
+//: Now let's suppose we need to ensure the names of a handful of items are unique.  Let's say 30
+//: items. And let's decide we can live with a 1 in 100,000 probability of collision (we're just
+//: futzing with some code ideas). Using hex characters we get:
+bits = Entropy.bits(total: 30, risk: .ten05)
+string = RandomString.entropy(of: bits, using: .base16)
+print("String: \(string)\n")
+//: * callout(string): 766923a
+//:
+//: Using base 4 characters we get:
+string = RandomString.entropy(of: bits, using: .base4)
+print("String: \(string)\n")
+//: * callout(string): GCGTCGGGTTTTA
+//:
+//: Okay, we probably wouldn't use base 4 (and what's up with those characters?), but you get the
+//: idea.
+//:
+//: Suppose we have a more extreme need. We want less than a 1 in a trillion chance that 10
+//: billion strings drawn from 32 characters repeat. Let's see, our risk (trillion) is 10 to the 12th and
+//: our total (10 billion) is 10 to the 10th, so:
+//:
+bits = Entropy.bits(total: .ten10, risk: .ten12)
+string = RandomString.entropy(of: bits, using: .base32)
+print("String: \(string)\n")
+//: * callout(string): F78PmfGRNfJrhHGTqpt6Hn
+//:
+//: Finally, let's say we're generating session IDs. We're not interested in uniqueness per se, but in
+//: ensuring our IDs aren't predictable since we can't have the bad guys guessing a valid ID. In
+//: this case, we're using entropy as a measure of unpredictability of the IDs. Rather than calculate
+//: our entropy, we declare it needs to be 128 bits (since we read on some web site that session IDs
+//: should be 128 bits).
+string = RandomString.entropy(of: 128, using: .base64)
+print("String: \(string)\n")
+//: * callout(string): b0Gnh6H5cKCjWrCLwKoeuN
+//:
+//: Using 64 characters, our string length is 22 characters. That's actually 132 bits, so we've got
+//: our OWASP requirement covered! 😌
+//:
+//: Also note that we covered our need using strings that are only 22 characters in length. So long
+//: to using GUID strings which only carry 122 bits of entropy (for the commonly used version 4
+//: anyway) and use string representations (hex and dashes) that are 36 characters in length.
+//:
+//: [TOC](Table%20of%20Contents) | [Next](@next)
@@ -0,0 +1,32 @@
+//: [Previous](@previous)
+//:
+//: ## Overview
+//:
+//: `EntropyString` provides easy creation of randomly generated strings of specific entropy using
+//: various character bases. Such strings are needed when generating, for example, random IDs and
+//: you don't want the overkill of a GUID, or for ensuring that some number of items have unique
+//: names.
+//:
+//: A key concern when generating such strings is that they be unique. To truly guarantee uniqueness
+//: requires that each newly created string be compared against all existing strings. The overhead
+//: of storing and comparing strings in this manner is often too onerous and a different strategy is
+//: desired.
+//:
+//: A common strategy is to replace the *guarantee of uniqueness* with a weaker but hopefully
+//: sufficient *probabilistic uniqueness*. Specifically, rather than being absolutely sure of
+//: uniqueness, we settle for a statement such as *"there is less than a 1 in a billion chance that
+//: two of my strings are the same"*. This strategy requires much less overhead, but does require
+//: we have some manner of quantifying what we mean by, for example, *"there is less than a 1 in a
+//: billion chance that 1 million strings of this form will have a repeat"*.
+//:
+//: Understanding probabilistic uniqueness requires some understanding of
+//: [*entropy*](https://en.wikipedia.org/wiki/Entropy_(information_theory)) and of estimating the
+//: probability of a
+//: [*collision*](https://en.wikipedia.org/wiki/Birthday_problem#Cast_as_a_collision_problem) (i.e.,
+//: the probability that two strings in a set of randomly generated strings might be the same).
+//: Happily, you can use `EntropyString` without a deep understanding of these topics.
+//:
+//: We'll begin investigating `EntropyString` by considering our [Real Need](Real%20Need) when
+//: generating random strings.
+//:
+//: [TOC](Table%20of%20Contents) | [Next](@next)
@@ -0,0 +1,88 @@
+//: [Previous](@previous)
+//: ## Real Need
+//:
+//: Let's start by reflecting on a common developer statement of need:
+//:
+//: *I need random strings 16 characters long.*
+//:
+//: Okay. There are libraries available that address that exact need. But first, there are some
+//: questions that arise from the need as stated, such as:
+//:
+//:  1. What characters do you want to use?
+//:  2. How many of these strings do you need?
+//:  3. Why do you need these strings?
+//:
+//: The available libraries often let you specify the characters to use. So we can assume for now
+//: that question 1 is answered with:
+//:
+//: *Hexadecimal IDs will do fine*.
+//:
+//: As for question 2, the developer might respond:
+//:
+//: *I need 10,000 of these things*.
+//:
+//: Ah, now we're getting somewhere. The answer to question 3 might lead to the further qualification:
+//:
+//: *I need to generate 10,000 random, unique IDs*.
+//:
+//: And the cat's out of the bag. We're getting at the real need, and it's not the same as the original
+//: statement. The developer needs *uniqueness* across a total of some number of strings. The length of
+//: the string is a by-product of the uniqueness, not the goal.
+//: 
+//: As noted in the [Overview](Overview), guaranteeing uniqueness is difficult, so we'll replace that
+//: declaration with one of *probabilistic uniqueness* by asking:
+//:
+//:   4. What risk of a repeat are you willing to accept?
+//:
+//: Probabilistic uniqueness contains risk. That's the price we pay for giving up on the stronger
+//: declaration of strict uniqueness. But the developer can quantify an appropriate risk for a
+//: particular scenario with a statement like:
+//:
+//: *I guess I can live with a 1 in a million chance of a repeat*.
+//:
+//: So now we've gotten to the real need:
+//:
+//: *I need 10,000 random hexadecimal IDs with less than 1 in a million chance of any repeats*.
+//:
+//: How do you address this need using a library designed to generate strings of specified length?
+//: Well, you don't directly, because that library was designed to answer the originally stated need,
+//: not the real need we've uncovered. We need a library that deals with probabilistic uniqueness
+//: of a total number of some strings. And that's exactly what `EntropyString` does.
+//:
+//: Let's use `EntropyString` to help this developer:
+import EntropyString
+
+let bits = Entropy.bits(total: 10000, risk: .ten06)  // entropy needed for 10,000 IDs at a 1-in-a-million repeat risk
+var strings = [String]()
+for _ in 0 ..< 5 {  // the loop index is unused; we just want five sample IDs
+  let string = RandomString.entropy(of: bits, using: .base16)
+  strings.append(string)
+}
+print("Strings: \(strings)")
+//: * callout(strings): ["85e442fa0e83", "a74dc126af1e", "368cd13b1f6e", "81bf94e1278d", "fe7dec099ac9"]
+//:
+//: To generate the IDs, we first use
+//:
+//: ```swift
+//:   let bits = Entropy.bits(total: 10000, risk: .ten06)
+//: ```
+//:
+//: to determine the bits of entropy needed to satisfy our probabilistic uniqueness of **10,000**
+//: strings with a **1 in a million** (ten to the sixth power) risk of repeat. We didn't print the
+//: result, but if you did you'd see it's about **45.51**. Then inside a loop we used
+//:
+//: ```swift
+//:   let string = RandomString.entropy(of: bits, using: .base16)
+//: ```
+//:
+//: to actually generate random strings using hexadecimal (base16) characters. Looking at the IDs, we can
+//: see each is 12 characters long. Again, the string length is a by-product of the characters used to
+//: represent the entropy we needed. And it seems the developer didn't really need 16 characters after all.
+//:
+//: Finally, given that the strings are 12 hexadecimals long, each string actually has an
+//: information carrying capacity of 12 * 4 = 48 bits of entropy (a hexadecimal character carries 4
+//: bits). That's fine. Assuming all characters are equally probable, a string can only carry entropy
+//: equal to a multiple of the amount of entropy represented per character. `EntropyString` produces
+//: the smallest strings that *meet or exceed* the specified entropy.
+//:
+//: [TOC](Table%20of%20Contents) | [Next](@next)
@@ -0,0 +1,37 @@
+//: [Previous](@previous)
+//: ## Secure Bytes
+//:
+//: As described in [Efficiency](Efficiency), `EntropyString` uses an underlying array of
+//: bytes to generate strings. The entropy of the resulting strings is, of course, directly
+//: tied to the randomness of the bytes used. That's an important point. Strings are only capable
+//: of carrying information (entropy); it's the random bytes that actually provide the entropy
+//: itself.
+//:
+//: `EntropyString` automatically generates the necessary number of bytes needed for the
+//: strings using either `SecRandomCopyBytes` or `arc4random_buf`, both of which produce
+//: cryptographically-secure random bytes. `SecRandomCopyBytes` is the stronger of the two,
+//: but can fail. Rather than propagate that failure, if `SecRandomCopyBytes` fails,
+//: `EntropyString` falls back and uses `arc4random_buf` to generate the bytes. Though not as
+//: secure, `arc4random_buf` does not fail.
+//:
+//: You may, however, want to know which routine was used to generate the underlying bytes for a
+//: string. `RandomString` provides an additional `inout` parameter in the
+//: `RandomString.entropy(of:using:secure:)` function for this purpose.
+import EntropyString
+
+var secure = true
+RandomString.entropy(of: 20, using: .base32, secure: &secure)
+print("secure: \(secure)")
+//: * callout(secure): true
+//:
+//: If `SecRandomCopyBytes` is used, the __secure__ parameter will remain `true`; otherwise it
+//: will be flipped to `false`.
+//:
+//: You can also pass in __secure__ as `false`, in which case the `entropy` call will not
+//: attempt to use `SecRandomCopyBytes` and will use `arc4random_buf` instead.
+secure = false
+RandomString.entropy(of: 20, using: .base32, secure: &secure)
+//: Rather than have `EntropyString` generate bytes automatically, you can provide your own [Custom
+//: Bytes](Custom%20Bytes) to create a string, which is the next topic.
+//:
+//: [TOC](Table%20of%20Contents) | [Next](@next)