Browse Source

Added split text functionality.

master
Craig Oates 6 years ago
parent
commit
12a4b2c813
  1. 8
      WetPancake/DataCleaning.fs
  2. 4
      WetPancake/Script.fsx

8
WetPancake/DataCleaning.fs

@ -1,6 +1,8 @@
module internal DataCleaning
open System.IO
open System.Text.RegularExpressions
open System.IO
open System.Text.RegularExpressions
/// Replaces every match of the regular-expression `pattern` found in `text`
/// with a single space and returns the resulting string.
/// Note: `pattern` is interpreted as a regex, not as a literal substring.
let ReplaceArtifact pattern text = Regex.Replace(text, pattern, " ")
/// Splits `text` at every match of the regular-expression `pattern`
/// and returns the pieces as an array of strings.
let SplitText (pattern: string) (text: string) : string[] =
    Regex.Split(text, pattern)

4
WetPancake/Script.fsx

@ -20,6 +20,7 @@ let ss_item =
let items = seq{1 .. 10}
PickRandomItem (Random().Next) items
// Data Access
// Scratch binding for CreateSampleTextFilesPath (defined outside this snippet);
// presumably the sample-files location -- TODO confirm against its definition.
let da_sampleFilePath = CreateSampleTextFilesPath
// Feeds the binding above into FindSampleTextFiles (also defined elsewhere).
let da_sampleTextFiles =
    da_sampleFilePath
    |> FindSampleTextFiles
@ -38,4 +39,5 @@ let dc_replace5 =
|> ReplaceArtifact "\""
|> ReplaceArtifact "\n\nIn"
|> ReplaceArtifact "\r"
|> ReplaceArtifact "\n"
|> ReplaceArtifact "\n"
// Scratch check for SplitText: splits the sample sentence on runs of whitespace.
let dc_split =
    "This is a test string."
    |> SplitText @"\s+"
Loading…
Cancel
Save