From b8fedea0cfc1cb9cb7f66069b5620b8bd2cbbd19 Mon Sep 17 00:00:00 2001 From: Bas Broek Date: Fri, 2 Dec 2016 11:04:46 +0100 Subject: [PATCH 01/11] Add support for counting syllables --- Analysis/Classes/Analysis.swift | 17 +++ Analysis/Classes/SyllableCounter.swift | 203 +++++++++++++++++++++++++ Example/Tests/AnalysisTests.swift | 16 ++ 3 files changed, 236 insertions(+) create mode 100755 Analysis/Classes/SyllableCounter.swift diff --git a/Analysis/Classes/Analysis.swift b/Analysis/Classes/Analysis.swift index d8b18b4..60753f9 100644 --- a/Analysis/Classes/Analysis.swift +++ b/Analysis/Classes/Analysis.swift @@ -63,6 +63,13 @@ public struct Analysis { } } + /// Returns the total amount of syllables of the `input`. + public func syllableCount() -> Int { + return words + .map { $0.syllables } + .reduce(0, +) + } + /// Returns the character count of the `input`. /// /// - Parameter includingSpaces: Indicating if characters @@ -138,6 +145,16 @@ public struct Analysis { .filter { $0 == character }.count } + /// Returns the syllables of every unique word. + public func wordSyllables() -> [String: Int] { + var syllables: [String: Int] = [:] + let uniqueWords = Array(_wordOccurrences(caseSensitive: false).keys) + + uniqueWords.forEach { syllables[$0] = $0.syllables } + + return syllables + } + /// Returns the frequency of the specified word. /// /// - Parameter caseSensitive: Indicating if words diff --git a/Analysis/Classes/SyllableCounter.swift b/Analysis/Classes/SyllableCounter.swift new file mode 100755 index 0000000..bbd6ae8 --- /dev/null +++ b/Analysis/Classes/SyllableCounter.swift @@ -0,0 +1,203 @@ +// +// SyllableCounter.swift +// +// Created by Warren Freitag on 2/14/16. +// Copyright © 2016 Warren Freitag. All rights reserved. +// Licensed under the Apache 2.0 License. +// +// Adapted from a Java implementation created by Hugo "m09" Mougard. +// https://github.com/m09/syllable-counter +// + +import UIKit + +public class SyllableCounter { + + // MARK: - Shared instance + + public static let shared = SyllableCounter() + + // MARK: - Private properties + + private var exceptions: [String: Int] = [ + "brutes": 1, + "chummed": 1, + "flapped": 1, + "foamed": 1, + "gaped": 1, + "h'm": 1, + "lb": 1, + "mimes": 1, + "ms": 1, + "peeped": 1, + "sheered": 1, + "st": 1, + "queue": 1, + "none": 1, + "leaves": 1, + "awesome": 2, + "60": 2, + "capered": 2, + "caressed": 2, + "clattered": 2, + "deafened": 2, + "dr": 2, + "effaced": 2, + "effaces": 2, + "fringed": 2, + "greyish": 2, + "jr": 2, + "mangroves": 2, + "messieurs": 2, + "motioned": 2, + "moustaches": 2, + "mr": 2, + "mrs": 2, + "pencilled": 2, + "poleman": 2, + "quivered": 2, + "reclined": 2, + "shivered": 2, + "sidespring": 2, + "slandered": 2, + "sombre": 2, + "sr": 2, + "stammered": 2, + "suavely": 2, + "tottered": 2, + "trespassed": 2, + "truckle": 2, + "unstained": 2, + "therefore": 2, + "businesses": 3, + "bottleful": 3, + "discoloured": 3, + "disinterred": 3, + "hemispheres": 3, + "manoeuvred": 3, + "sepulchre": 3, + "shamefully": 3, + "unexpressed": 3, + "veriest": 3, + "wyoming": 3, + "etc": 4, + "sailmaker": 4, + "satiated": 4, + "sententiously": 4, + "particularized": 5, + "unostentatious": 5, + "propitiatory": 6, + ] + + private var addSyllables: [NSRegularExpression]! + private var subSyllables: [NSRegularExpression]! + + private let vowels: Set = ["a", "e", "i", "o", "u", "y"] + + // MARK: - Error enum + + private enum SyllableCounterError: Error { + case badRegex(String) + case badExceptionsData(String) + } + + // MARK: - Constructors + + public init() { + do { + try populateAddSyllables() + try populateSubSyllables() + } + catch SyllableCounterError.badRegex(let pattern) { + print("Bad Regex pattern: \(pattern)") + } + catch SyllableCounterError.badExceptionsData(let info) { + print("Problem parsing exceptions dataset: \(info)") + } + catch { + print("An unexpected error occured while initializing the syllable counter.") + } + } + + // MARK: - Setup + + private func populateAddSyllables() throws { + try addSyllables = buildRegexes(forPatterns: [ + "ia", "riet", "dien", "iu", "io", "ii", + "[aeiouy]bl$", "mbl$", "tl$", "sl$", "[aeiou]{3}", + "^mc", "ism$", "(.)(?!\\1)([aeiouy])\\2l$", "[^l]llien", "^coad.", + "^coag.", "^coal.", "^coax.", "(.)(?!\\1)[gq]ua(.)(?!\\2)[aeiou]", "dnt$", + "thm$", "ier$", "iest$", "[^aeiou][aeiouy]ing$"]) + } + + private func populateSubSyllables() throws { + try subSyllables = buildRegexes(forPatterns: [ + "cial", "cian", "tia", "cius", "cious", + "gui", "ion", "iou", "sia$", ".ely$", + "ves$", "geous$", "gious$", "[^aeiou]eful$", ".red$"]) + } + + private func buildRegexes(forPatterns patterns: [String]) throws -> [NSRegularExpression] { + return try patterns.map { pattern -> NSRegularExpression in + do { + let regex = try NSRegularExpression(pattern: pattern, options: [.caseInsensitive, .anchorsMatchLines]) + return regex + } + catch { + throw SyllableCounterError.badRegex(pattern) + } + } + } + + // MARK: - Public methods + + internal func count(word: String) -> Int { + if word.characters.count <= 1 { + return word.characters.count + } + + var mutatedWord = word.lowercased(with: Locale(identifier: "en_US")).trimmingCharacters(in: .punctuationCharacters) + + if let exceptionValue = exceptions[mutatedWord] { + return exceptionValue + } + + if mutatedWord.characters.last == "e" { + mutatedWord = String(mutatedWord.characters.dropLast()) + } + + var count = 0 + var previousIsVowel = false + + for character in mutatedWord.characters { + let isVowel = vowels.contains(character) + if isVowel && !previousIsVowel { + count += 1 + } + previousIsVowel = isVowel + } + + for pattern in addSyllables { + let matches = pattern.matches(in: mutatedWord, options: NSRegularExpression.MatchingOptions(rawValue: 0), range: NSRange(location: 0, length: mutatedWord.characters.count)) + if !matches.isEmpty { + count += 1 + } + } + + for pattern in subSyllables { + let matches = pattern.matches(in: mutatedWord, options: NSRegularExpression.MatchingOptions(rawValue: 0), range: NSRange(location: 0, length: mutatedWord.characters.count)) + if !matches.isEmpty { + count -= 1 + } + } + + return (count > 0) ? count : 1 + } +} + +extension String { + + internal var syllables: Int { + return SyllableCounter.shared.count(word: self) + } +} diff --git a/Example/Tests/AnalysisTests.swift b/Example/Tests/AnalysisTests.swift index 912bad6..6f9cd8d 100644 --- a/Example/Tests/AnalysisTests.swift +++ b/Example/Tests/AnalysisTests.swift @@ -158,4 +158,20 @@ class AnalysisTests: XCTestCase { XCTAssertEqual(helloWorld1.averageWordsPerSentence, 2.0) XCTAssertEqual(repeating.averageWordsPerSentence, 3.0) } + + func testSyllableCount() { + XCTAssertEqual(helloWorld1.syllableCount(), 3) + XCTAssertEqual(helloWorld2.syllableCount(), 3) + XCTAssertEqual(a.syllableCount(), 1) + XCTAssertEqual(z.syllableCount(), 1) + XCTAssertEqual(repeating.syllableCount(), 6) + } + + func testWordSyllables() { + XCTAssertEqual(helloWorld1.wordSyllables(), ["hello": 2, "world": 1]) + XCTAssertEqual(helloWorld2.wordSyllables(), ["hello": 2, "world": 1]) + XCTAssertEqual(a.wordSyllables(), ["a": 1]) + XCTAssertEqual(z.wordSyllables(), ["z": 1]) + XCTAssertEqual(repeating.wordSyllables(), ["repeat": 2]) + } } From 58bb7b37fdd4287ac92832fc0861567e4b899ff1 Mon Sep 17 00:00:00 2001 From: Bas Broek Date: Fri, 2 Dec 2016 11:05:27 +0100 Subject: [PATCH 02/11] Add support for Flesch Reading Ease score and Flesch-Kincaid Grade Level --- Analysis/Classes/Analysis.swift | 23 +++++++++++++++++++++++ 1 file changed, 23 insertions(+) diff --git a/Analysis/Classes/Analysis.swift b/Analysis/Classes/Analysis.swift index 60753f9..5c1b7d5 100644 --- a/Analysis/Classes/Analysis.swift +++ b/Analysis/Classes/Analysis.swift @@ -17,6 +17,7 @@ public enum LengthOption { /// An analysis of a `String`. public struct Analysis { public typealias Percentage = Double + public typealias Grade = Double /// The string used to construct the `Analysis`. public let input: String @@ -201,6 +202,28 @@ public struct Analysis { public var averageWordsPerSentence: Double { return Double(wordCount()) / Double(sentenceCount()) } + + private var _wordsPerSentences: Double { + return Double(wordCount()) / Double(sentenceCount()) + } + + private var _syllablesPerWords: Double { + return Double(syllableCount()) / Double(wordCount()) + } + + /// Returns the Flesch reading ease score. + /// + /// - Note: https://en.wikipedia.org/wiki/Flesch–Kincaid_readability_tests#Flesch_reading_ease + public func fleschReadingEase() -> Percentage { + return 206.835 - 1.015 * _wordsPerSentences - 84.6 * _syllablesPerWords + } + + /// Returns the Flesch-Kincaid grade level. + /// + /// - Note: https://en.wikipedia.org/wiki/Flesch–Kincaid_readability_tests#Flesch.E2.80.93Kincaid_grade_level + public func fleschKincaidGradeLevel() -> Grade { + return 0.39 * _wordsPerSentences + 11.8 * _syllablesPerWords - 15.59 + } } extension Analysis: Hashable { From b91e636fe27ef5af826516e15dd72c207d59e0c3 Mon Sep 17 00:00:00 2001 From: Bas Broek Date: Fri, 2 Dec 2016 11:05:39 +0100 Subject: [PATCH 03/11] Use an extension to lowercase Character --- Analysis/Classes/Analysis.swift | 6 +++--- Analysis/Classes/Character+Casing.swift | 20 ++++++++++++++++++++ 2 files changed, 23 insertions(+), 3 deletions(-) create mode 100644 Analysis/Classes/Character+Casing.swift diff --git a/Analysis/Classes/Analysis.swift b/Analysis/Classes/Analysis.swift index 5c1b7d5..3e604dd 100644 --- a/Analysis/Classes/Analysis.swift +++ b/Analysis/Classes/Analysis.swift @@ -95,7 +95,7 @@ public struct Analysis { private func _characterOccurences(caseSensitive: Bool = false) -> [Character: Int] { var occurrences: [Character: Int] = [:] characters - .map { (caseSensitive) ? $0 : Character(String(describing: $0).lowercased()) } + .map { (caseSensitive) ? $0 : $0.lowercased() } .forEach { occurrences[$0] = (occurrences[$0] ?? 0) + 1 } return occurrences } @@ -140,9 +140,9 @@ public struct Analysis { /// should be counted regardless of their case sensitivity. /// Defaults to `false`. public func occurrences(of character: Character, caseSensitive: Bool = false) -> Int { - let character = (caseSensitive) ? character : Character(String(describing: character).lowercased()) + let character = (caseSensitive) ? character : character.lowercased() return characters - .map { (caseSensitive) ? $0 : Character(String(describing: $0).lowercased()) } + .map { (caseSensitive) ? $0 : $0.lowercased() } .filter { $0 == character }.count } diff --git a/Analysis/Classes/Character+Casing.swift b/Analysis/Classes/Character+Casing.swift new file mode 100644 index 0000000..608e670 --- /dev/null +++ b/Analysis/Classes/Character+Casing.swift @@ -0,0 +1,20 @@ +// +// Character+Casing.swift +// Pods +// +// Created by Bas Broek on 02/12/2016. +// +// + +import Foundation + +internal extension Character { + + func lowercased() -> Character { + return Character(String(describing: self).lowercased()) + } + + func uppercased() -> Character { + return Character(String(describing: self).uppercased()) + } +} From 1fef404a3f75d446467d51a15e72bb1f322f39a2 Mon Sep 17 00:00:00 2001 From: Bas Broek Date: Fri, 2 Dec 2016 11:24:57 +0100 Subject: [PATCH 04/11] Add syllable and Flesch examples to Readme --- README.md | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/README.md b/README.md index 8d80eca..0ef854b 100644 --- a/README.md +++ b/README.md @@ -46,6 +46,11 @@ analysis.wordOccurrences(caseSensitive: true) // ["You": 1, "are": 1, "awesome", analysis.wordOccurrences(caseSensitive: false) // ["you": 2, "are": 1, "awesome", 1] analysis.frequency(of: "you", caseSensitive: false) // 50.0% analysis.averageCharacters(per: .word) // 5.33 + +analysis.syllableCount() // 5 +analysis.wordSyllables() // ["you": 1, "are": 1, "awesome": 2] +analysis.fleschReadingEase() // 97.025 +analysis.fleschKincaidGradeLevel() // 0.72 ``` You can also easily sort your occurences via an enhanced sorting method on `Dictionary`. From 94cb9fe33dc39a2400f16dd2e91a0428aa7ab35d Mon Sep 17 00:00:00 2001 From: Bas Broek Date: Fri, 2 Dec 2016 11:29:43 +0100 Subject: [PATCH 05/11] Add changelog --- Changelog.md | 9 +++++++++ 1 file changed, 9 insertions(+) create mode 100644 Changelog.md diff --git a/Changelog.md b/Changelog.md new file mode 100644 index 0000000..f792f45 --- /dev/null +++ b/Changelog.md @@ -0,0 +1,9 @@ +# next + +- Added `syllableCount()`, which counts the total amount of syllables of the `input`. +- Added `wordSyllables()`, which returns the syllables of every unique word. +- Added `fleschReadingEase()`, which calculates the [Flesch reading ease score](https://en.wikipedia.org/wiki/Flesch–Kincaid_readability_tests#Flesch_reading_ease). +- Added `fleschKincaidGradeLevel()`, which calculates the [Flesch-Kincaid grade level](https://en.wikipedia.org/wiki/Flesch–Kincaid_readability_tests#Flesch.E2.80.93Kincaid_grade_level). + +# [0.1.0](https://github.com/BasThomas/Analysis/releases/tag/0.1.0) +Initial release. From 81f5d53e49e8f62773eb28efd0553f2527777daf Mon Sep 17 00:00:00 2001 From: Bas Broek Date: Fri, 2 Dec 2016 11:33:54 +0100 Subject: [PATCH 06/11] Fix typo --- Analysis/Classes/Analysis.swift | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Analysis/Classes/Analysis.swift b/Analysis/Classes/Analysis.swift index 3e604dd..5f2d7a4 100644 --- a/Analysis/Classes/Analysis.swift +++ b/Analysis/Classes/Analysis.swift @@ -8,7 +8,7 @@ import Foundation -/// The option to when calculating average length. This is either `.word` or `.sentence`. +/// The option to use when calculating average length. This is either `.word` or `.sentence`. public enum LengthOption { case word case sentence From 86bbeb6b3509924205e359a92cbf55cb20ed18dc Mon Sep 17 00:00:00 2001 From: Bas Broek Date: Fri, 2 Dec 2016 11:35:02 +0100 Subject: [PATCH 07/11] Remove creation information --- Analysis/Classes/Analysis.swift | 8 -------- Analysis/Classes/Character+Casing.swift | 8 -------- Analysis/Classes/Dictionary+Sorting.swift | 8 -------- Analysis/Classes/String+Analysis.swift | 8 -------- Analysis/Classes/SyllableCounter.swift | 2 +- 5 files changed, 1 insertion(+), 33 deletions(-) diff --git a/Analysis/Classes/Analysis.swift b/Analysis/Classes/Analysis.swift index 5f2d7a4..935b3e3 100644 --- a/Analysis/Classes/Analysis.swift +++ b/Analysis/Classes/Analysis.swift @@ -1,11 +1,3 @@ -// -// Analysis.swift -// -// -// Created by Bas Broek on 11/11/2016. -// -// - import Foundation /// The option to use when calculating average length. This is either `.word` or `.sentence`. diff --git a/Analysis/Classes/Character+Casing.swift b/Analysis/Classes/Character+Casing.swift index 608e670..f634bab 100644 --- a/Analysis/Classes/Character+Casing.swift +++ b/Analysis/Classes/Character+Casing.swift @@ -1,11 +1,3 @@ -// -// Character+Casing.swift -// Pods -// -// Created by Bas Broek on 02/12/2016. -// -// - import Foundation internal extension Character { diff --git a/Analysis/Classes/Dictionary+Sorting.swift b/Analysis/Classes/Dictionary+Sorting.swift index 2e29629..aa6267a 100644 --- a/Analysis/Classes/Dictionary+Sorting.swift +++ b/Analysis/Classes/Dictionary+Sorting.swift @@ -1,11 +1,3 @@ -// -// Dictionary+Sorting.swift -// -// -// Created by Bas Broek on 11/11/2016. -// -// - import Foundation /// The sort option of the dictionary. This is either `.key` or `.value`. diff --git a/Analysis/Classes/String+Analysis.swift b/Analysis/Classes/String+Analysis.swift index b8ad4d5..075b655 100644 --- a/Analysis/Classes/String+Analysis.swift +++ b/Analysis/Classes/String+Analysis.swift @@ -1,11 +1,3 @@ -// -// String+Analysis.swift -// -// -// Created by Bas Broek on 11/11/2016. -// -// - import Foundation public extension String { diff --git a/Analysis/Classes/SyllableCounter.swift b/Analysis/Classes/SyllableCounter.swift index bbd6ae8..16d4042 100755 --- a/Analysis/Classes/SyllableCounter.swift +++ b/Analysis/Classes/SyllableCounter.swift @@ -9,7 +9,7 @@ // https://github.com/m09/syllable-counter // -import UIKit +import Foundation public class SyllableCounter { From bb153a0e5bca9a9d8c722a59ee9ed26043af546e Mon Sep 17 00:00:00 2001 From: Bas Broek Date: Fri, 2 Dec 2016 13:16:37 +0100 Subject: [PATCH 08/11] Add syllable count and Flesch-tests to Example app --- Example/Analysis.xcodeproj/project.pbxproj | 4 + Example/Analysis/Analysis.storyboard | 143 ++++++++++++++---- .../AnalysisTableViewController.swift | 40 ++++- .../Analysis/UIViewController+Safari.swift | 32 ++++ 4 files changed, 184 insertions(+), 35 deletions(-) create mode 100644 Example/Analysis/UIViewController+Safari.swift diff --git a/Example/Analysis.xcodeproj/project.pbxproj b/Example/Analysis.xcodeproj/project.pbxproj index 594d646..a7d1bfa 100644 --- a/Example/Analysis.xcodeproj/project.pbxproj +++ b/Example/Analysis.xcodeproj/project.pbxproj @@ -9,6 +9,7 @@ /* Begin PBXBuildFile section */ 4978479C1DD87E4A003CFFBB /* Analysis.storyboard in Resources */ = {isa = PBXBuildFile; fileRef = 4978479B1DD87E4A003CFFBB /* Analysis.storyboard */; }; 4978479E1DD88148003CFFBB /* AnalysisTableViewController.swift in Sources */ = {isa = PBXBuildFile; fileRef = 4978479D1DD88148003CFFBB /* AnalysisTableViewController.swift */; }; + 4985BEC11DF1959500B36F51 /* UIViewController+Safari.swift in Sources */ = {isa = PBXBuildFile; fileRef = 4985BEC01DF1959500B36F51 /* UIViewController+Safari.swift */; }; 607FACD61AFB9204008FA782 /* AppDelegate.swift in Sources */ = {isa = PBXBuildFile; fileRef = 607FACD51AFB9204008FA782 /* AppDelegate.swift */; }; 607FACD81AFB9204008FA782 /* ViewController.swift in Sources */ = {isa = PBXBuildFile; fileRef = 607FACD71AFB9204008FA782 /* ViewController.swift */; }; 607FACDB1AFB9204008FA782 /* Main.storyboard in Resources */ = {isa = PBXBuildFile; fileRef = 607FACD91AFB9204008FA782 /* Main.storyboard */; }; @@ -36,6 +37,7 @@ 45E49C4F9720F93380BF3A10 /* Pods-Analysis_Tests.debug.xcconfig */ = {isa = PBXFileReference; includeInIndex = 1; lastKnownFileType = text.xcconfig; name = "Pods-Analysis_Tests.debug.xcconfig"; path = "Pods/Target Support Files/Pods-Analysis_Tests/Pods-Analysis_Tests.debug.xcconfig"; sourceTree = ""; }; 4978479B1DD87E4A003CFFBB /* Analysis.storyboard */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = file.storyboard; path = Analysis.storyboard; sourceTree = ""; }; 4978479D1DD88148003CFFBB /* AnalysisTableViewController.swift */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.swift; path = AnalysisTableViewController.swift; sourceTree = ""; }; + 4985BEC01DF1959500B36F51 /* UIViewController+Safari.swift */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.swift; path = "UIViewController+Safari.swift"; sourceTree = ""; }; 607FACD01AFB9204008FA782 /* Analysis_Example.app */ = {isa = PBXFileReference; explicitFileType = wrapper.application; includeInIndex = 0; path = Analysis_Example.app; sourceTree = BUILT_PRODUCTS_DIR; }; 607FACD41AFB9204008FA782 /* Info.plist */ = {isa = PBXFileReference; lastKnownFileType = text.plist.xml; path = Info.plist; sourceTree = ""; }; 607FACD51AFB9204008FA782 /* AppDelegate.swift */ = {isa = PBXFileReference; lastKnownFileType = sourcecode.swift; path = AppDelegate.swift; sourceTree = ""; }; @@ -111,6 +113,7 @@ 607FACD51AFB9204008FA782 /* AppDelegate.swift */, 607FACD71AFB9204008FA782 /* ViewController.swift */, 4978479D1DD88148003CFFBB /* AnalysisTableViewController.swift */, + 4985BEC01DF1959500B36F51 /* UIViewController+Safari.swift */, 607FACD91AFB9204008FA782 /* Main.storyboard */, 4978479B1DD87E4A003CFFBB /* Analysis.storyboard */, 607FACDC1AFB9204008FA782 /* Images.xcassets */, @@ -370,6 +373,7 @@ files = ( 607FACD81AFB9204008FA782 /* ViewController.swift in Sources */, 607FACD61AFB9204008FA782 /* AppDelegate.swift in Sources */, + 4985BEC11DF1959500B36F51 /* UIViewController+Safari.swift in Sources */, 4978479E1DD88148003CFFBB /* AnalysisTableViewController.swift in Sources */, ); runOnlyForDeploymentPostprocessing = 0; diff --git a/Example/Analysis/Analysis.storyboard b/Example/Analysis/Analysis.storyboard index 42ebdb2..a6654f0 100644 --- a/Example/Analysis/Analysis.storyboard +++ b/Example/Analysis/Analysis.storyboard @@ -21,21 +21,21 @@ - + - + - + - + - + - + - + - + - + - + + + + + + + + + + + + +