source: icGREP/icgrep-devel/icgrep/lz4_grep.cpp @ 6059

Last change on this file since 6059 was 6059, checked in by xwa163, 12 months ago
  1. Enable swizzled match copy in multiplexing lz4_grep for some special cases
  2. Implement some lz4 AIO (all-in-one) pipelines and related kernels
File size: 4.4 KB
Line 
1/*
2 *  Copyright (c) 2017 International Characters.
3 *  This software is licensed to the public under the Open Software License 3.0.
4 *  icgrep is a trademark of International Characters.
5 */
6
7
8#include <llvm/IR/Module.h>
9#include <llvm/Linker/Linker.h>
10#include <llvm/Support/PrettyStackTrace.h>
11#include <llvm/Support/Signals.h>
12#include <llvm/Support/ManagedStatic.h>
13#include <IR_Gen/idisa_target.h>
14#include <boost/filesystem.hpp>
15#include <boost/iostreams/device/mapped_file.hpp>
16
17#include <lz4FrameDecoder.h>
18#include <cc/cc_compiler.h>
19#include <toolchain/toolchain.h>
20#include <kernels/cc_kernel.h>
21#include <kernels/streamset.h>
22#include <kernels/s2p_kernel.h>
23#include <kernels/kernel_builder.h>
24#include <toolchain/cpudriver.h>
25
26#include <iostream>
27#include <lz4/LZ4GrepGenerator.h>
28
29
30#include <re/re_alt.h>
31#include <re/re_start.h>
32#include <re/re_end.h>
33#include <re/re_utility.h>
34#include <re/re_toolchain.h>
35#include <pablo/pablo_toolchain.h>
36#include <llvm/Support/raw_ostream.h>
37
38namespace re { class CC; }
39
40using namespace llvm;
41using namespace parabix;
42using namespace kernel;
43
44static cl::OptionCategory lz4GrepFlags("Command Flags", "lz4d options");
45static cl::opt<std::string> regexString(cl::Positional, cl::desc("<regex>"), cl::Required, cl::cat(lz4GrepFlags));
46static cl::opt<std::string> inputFile(cl::Positional, cl::desc("<input file>"), cl::Required, cl::cat(lz4GrepFlags));
47static cl::opt<bool> countOnly("count-only", cl::desc("Only count the match result"), cl::init(false), cl::cat(lz4GrepFlags));
48static cl::opt<bool> enableMultiplexing("enable-multiplexing", cl::desc("Enable CC multiplexing."), cl::init(false), cl::cat(lz4GrepFlags));
49
50static cl::OptionCategory lz4GrepDebugFlags("LZ4 Grep Debug Flags", "lz4d debug options");
51static cl::opt<bool> aio("aio", cl::desc("Use All-in-One Approach for LZ4 Decompression"), cl::init(false), cl::cat(lz4GrepDebugFlags));
52static cl::opt<bool> swizzledDecompression("swizzled-decompression", cl::desc("Use swizzle approach for decompression"), cl::init(false), cl::cat(lz4GrepDebugFlags));
53static cl::opt<bool> enableGather("enable-gather", cl::desc("Enable gather intrinsics for bitstream PDEP"), cl::init(false), cl::cat(lz4GrepDebugFlags));
54
55
56int main(int argc, char *argv[]) {
57    // This boilerplate provides convenient stack traces and clean LLVM exit
58    // handling. It also initializes the built in support for convenient
59    // command line option handling.
60    sys::PrintStackTraceOnErrorSignal(argv[0]);
61    llvm::PrettyStackTraceProgram X(argc, argv);
62    llvm_shutdown_obj shutdown;
63    codegen::ParseCommandLineOptions(argc, argv, {&lz4GrepFlags, &lz4GrepDebugFlags, codegen::codegen_flags()});
64    std::string fileName = inputFile;
65    LZ4FrameDecoder lz4Frame(fileName);
66    if (!lz4Frame.isValid()) {
67        errs() << "Invalid LZ4 file.\n";
68        return -1;
69    }
70
71    boost::iostreams::mapped_file_source mappedFile;
72    // Since mmap offset has to be multiples of pages, we can't use it to skip headers.
73    mappedFile.open(fileName , lz4Frame.getBlocksLength() + lz4Frame.getBlocksStart());
74    //char *fileBuffer = const_cast<char *>(mappedFile.data()) + lz4Frame.getBlocksStart();
75    char *fileBuffer = const_cast<char *>(mappedFile.data());
76    re::RE * re_ast = re::RE_Parser::parse(regexString, re::MULTILINE_MODE_FLAG);
77    LZ4GrepGenerator g(enableMultiplexing);
78    if (aio) {
79        if (enableMultiplexing) {
80            g.generateMultiplexingSwizzledAioPipeline2(re_ast);
81        } else if (swizzledDecompression) {
82            g.generateSwizzledAioPipeline(re_ast);
83        } else {
84            g.generateAioPipeline(re_ast);
85        }
86
87        auto main = g.getMainFunc();
88        main(fileBuffer, lz4Frame.getBlocksStart(), lz4Frame.getBlocksStart() + lz4Frame.getBlocksLength(), lz4Frame.hasBlockChecksum());
89    } else if (countOnly) {
90        if (swizzledDecompression) {
91            g.generateSwizzledCountOnlyGrepPipeline(re_ast);
92        } else {
93            g.generateCountOnlyGrepPipeline(re_ast, enableGather);
94        }
95
96        auto main = g.getMainFunc();
97        main(fileBuffer, lz4Frame.getBlocksStart(), lz4Frame.getBlocksStart() + lz4Frame.getBlocksLength(), lz4Frame.hasBlockChecksum());
98    } else {
99        g.generateScanMatchGrepPipeline(re_ast);
100        g.invokeScanMatchGrep(fileBuffer, lz4Frame.getBlocksStart(), lz4Frame.getBlocksStart() + lz4Frame.getBlocksLength(), lz4Frame.hasBlockChecksum());
101
102    }
103
104
105    mappedFile.close();
106    return 0;
107}
Note: See TracBrowser for help on using the repository browser.