// helium/main_helium.cpp

// Copyright 2006 Google Inc.
// All Rights Reserved.
// Author: <renn@google.com> (Marius Renn)
//
// This is the main file for the core front-end to Helium. It is rather
// simple, and does not provide any debugging information.
// The detected text is output to a file called "text.dat".
//
// Please note that Leptonica is required for image loading!
//
// Local includes
#include "color.h"
#include "debugging.h"
#include "image.h"
#include "heliumbinarizer.h"
#include "heliumtextdetector.h"
#include "leptonica.h"
#include "textareas.h"
#include "textrecognition.h"

// C includes
#include <stdlib.h>

using namespace helium;

// Reports |message| through the ERROR macro and then ends the process by
// calling exit() with status -1, so this function does not return.
void ExitWithError(const char* message) {
  const int kFailureStatus = -1;
  ERROR(message);
  exit(kFailureStatus);
}

// Entry point of the core Helium front-end.
//
// Expects exactly one command-line argument: the path of the input image.
// The image is read with pixRead, converted with Leptonica::PixToImage,
// passed through HeliumTextDetector, and the detector's clusters are handed
// to a HeliumBinarizer that TextRecognition::RecognizeUsingBinarizer consumes.
// The recognized text areas are written via WriteDatFile("text.dat").
//
// Returns 0 when the pipeline runs to the end. A wrong argument count, a
// failed pixRead, or an invalid converted image terminates the process
// through ExitWithError instead of returning.
int main(int argc, char** argv) {
  // Usage check: the program name plus exactly one input file.
  if (argc != 2) ExitWithError("Usage: text_detect <input_file>");

  // Init Tesseract.
  // NOTE(review): "../" is presumably the path Tesseract is initialized
  // from, relative to the working directory -- confirm against
  // TextRecognition::Init.
  TextRecognition::Init("../");

  // Read input image and convert it to Helium's Image type.
  LOG_MSG("Reading file...");
  PIX* input = pixRead(argv[1]);
  if (!input) ExitWithError("Could not open image file!");
  // NOTE(review): `input` is never released in this function. Whether a
  // pixDestroy(&input) may be added after the conversion depends on whether
  // PixToImage copies the pixel data -- confirm before changing.
  Image image = Leptonica::PixToImage(input);
  if (!image.Valid()) ExitWithError("Error while loading image file!");

  // Run text detector with its default parameters.
  LOG_MSG("Running Text Detector...");
  HeliumTextDetector detector;
  detector.SetDefaultParameters();
  detector.DetectText(image);

  // Setup binarizer on the same image, fed with the detector's clusters.
  LOG_MSG("Setting up Binarizer...");
  HeliumBinarizer binarizer(image);
  binarizer.AddClusters(detector.GetClusters());

  // Run OCR; the results are collected in `text`.
  LOG_MSG("OCRing...");
  TextAreas text;
  TextRecognition::RecognizeUsingBinarizer(&binarizer, text);

  // Output Text
  text.WriteDatFile("text.dat");
  LOG_MSG("Done.");

  return 0;
}