Index talk:US Copyright Office - Renewal Registrations - 1950.djvu/Reformat
Add topic
// This is the code I'm using to reformat these pages.
import java.io._
/** Reformats an indentation-structured text file into records written to the file "bob".
  *
  * Every input line is represented as a `(text, indent)` pair: the line with its leading
  * spaces removed, and the number of leading spaces that were removed. A "group" is one
  * unindented line followed by the indented lines directly below it. A "record" is a group
  * plus any immediately following groups whose first line has empty text.
  */
object Process {

  /** Writer for the output file "bob" in the working directory.
    *
    * Lazy so that the file is only created (and truncated) when output is actually
    * produced, not merely because this object was initialised.
    */
  lazy val o: PrintWriter = new PrintWriter(new File("bob"))

  /** True when the first line of `group` has empty text; an empty group yields false. */
  private def startsWithBlank(group: Seq[(String, Int)]): Boolean =
    group.headOption.exists(_._1.isEmpty)

  /** Splits `data` into records: each record is a group followed by the run of
    * blank-headed groups that comes right after it. The very first group always opens a
    * record, whether or not it is blank-headed.
    */
  private def groupIntoRecords(
      data: Seq[Seq[(String, Int)]]
  ): Vector[Vector[Seq[(String, Int)]]] =
    data.foldLeft(Vector.empty[Vector[Seq[(String, Int)]]]) { (records, group) =>
      if (records.nonEmpty && startsWithBlank(group))
        records.updated(records.length - 1, records.last :+ group)
      else
        records :+ Vector(group)
    }

  /** Writes all records in `data` to [[o]] and then closes it.
    *
    * Within a record, each non-empty text is written followed by a single space; each
    * empty text ends the current output line and starts the next one with ":". Every
    * record is terminated by a line break and one blank line.
    *
    * Empty `data` writes nothing. The writer is closed in all cases, including when
    * writing throws, so this method is intended to be called once per run.
    *
    * @param data groups of `(text, indent)` lines, in input order
    */
  def outputFormattedData(data: Seq[Seq[(String, Int)]]): Unit = {
    // Force the lazy writer open before the try, so a failure to open the file is not
    // followed by a second open attempt from the finally clause.
    val out = o
    try {
      for (record <- groupIntoRecords(data)) {
        for (group <- record; line <- group) {
          val text = line._1
          if (text.isEmpty) {
            out.println("")
            out.print(":")
          } else {
            out.print(text + " ")
          }
        }
        out.println("")
        out.println("")
      }
    } finally out.close()
  }

  /** Returns every non-empty suffix of `s` whose first element satisfies `bp`, ordered
    * by starting position.
    *
    * Built on the standard `tails` iterator, so the call depth does not grow with the
    * length of `s`.
    *
    * @param s  the sequence to take suffixes of
    * @param bp predicate applied to the first element of each suffix
    * @tparam T element type
    */
  def allTails[T](s: Seq[T], bp: T => Boolean): Seq[Seq[T]] =
    s.tails.filter(_.headOption.exists(bp)).toVector

  /** Reads the input file, groups its lines by indentation and writes the result.
    *
    * @param args optional single argument: the input file name (defaults to "sample")
    */
  def main(args: Array[String]): Unit = {
    val file = args.headOption.getOrElse("sample")

    val source = scala.io.Source.fromFile(file)
    val lines =
      try source.getLines().toVector
      finally source.close()

    // (text without leading spaces, number of leading spaces)
    val indented = lines.map(l => (l.dropWhile(_ == ' '), l.takeWhile(_ == ' ').length))

    val processedData =
      allTails(indented, (x: (String, Int)) => x._2 == 0)
        // Keep the unindented line plus the indented lines directly under it.
        .map(x => x.head +: x.tail.takeWhile(_._2 != 0))
        // Drop groups that consist of nothing but a single blank line.
        .filter(l => l.length != 1 || l.head._1 != "")

    outputFormattedData(processedData.toVector)
  }
}
Public domainPublic domainfalsefalse
The standard Wikisource licenses apply to the original work of the contributor(s).
This work is licensed under the terms of the GNU Free Documentation License.
Public domainPublic domainfalsefalse
This work is released under the Creative Commons Attribution-ShareAlike 3.0 Unported license, which allows free use, distribution, and creation of derivatives, so long as the license is unchanged and clearly noted, and the original author is attributed.
Public domainPublic domainfalsefalse
Start a discussion about Index:US Copyright Office - Renewal Registrations - 1950.djvu/Reformat
Talk pages are where people discuss how to make content on Wikisource the best that it can be. You can use this page to start a discussion with others about how to improve Index:US Copyright Office - Renewal Registrations - 1950.djvu/Reformat.