source: icGREP/icgrep-devel/icgrep/lz4_grep.cpp @ 6104

Last change on this file since 6104 was 6081, checked in by xwa163, 13 months ago
  1. Add command-line parameters -enable-gather and -enable-scatter to lz4 parallel grep
  2. Fix some bugs on AVX512 machines
File size: 5.0 KB
Line 
1/*
2 *  Copyright (c) 2017 International Characters.
3 *  This software is licensed to the public under the Open Software License 3.0.
4 *  icgrep is a trademark of International Characters.
5 */
6
7
8#include <llvm/IR/Module.h>
9#include <llvm/Linker/Linker.h>
10#include <llvm/Support/PrettyStackTrace.h>
11#include <llvm/Support/Signals.h>
12#include <llvm/Support/ManagedStatic.h>
13#include <IR_Gen/idisa_target.h>
14#include <boost/filesystem.hpp>
15#include <boost/iostreams/device/mapped_file.hpp>
16
17#include <lz4FrameDecoder.h>
18#include <cc/cc_compiler.h>
19#include <toolchain/toolchain.h>
20#include <kernels/cc_kernel.h>
21#include <kernels/streamset.h>
22#include <kernels/s2p_kernel.h>
23#include <kernels/kernel_builder.h>
24#include <toolchain/cpudriver.h>
25
26#include <iostream>
27#include <lz4/LZ4GrepGenerator.h>
28
29
30#include <re/re_alt.h>
31#include <re/re_start.h>
32#include <re/re_end.h>
33#include <re/re_utility.h>
34#include <re/re_toolchain.h>
35#include <pablo/pablo_toolchain.h>
36#include <llvm/Support/raw_ostream.h>
37
38namespace re { class CC; }
39
40using namespace llvm;
41using namespace parabix;
42using namespace kernel;
43
44static cl::OptionCategory lz4GrepFlags("Command Flags", "lz4d options");
45static cl::opt<std::string> regexString(cl::Positional, cl::desc("<regex>"), cl::Required, cl::cat(lz4GrepFlags));
46static cl::opt<std::string> inputFile(cl::Positional, cl::desc("<input file>"), cl::Required, cl::cat(lz4GrepFlags));
47static cl::opt<bool> countOnly("count-only", cl::desc("Only count the match result"), cl::init(false), cl::cat(lz4GrepFlags));
48static cl::opt<bool> enableMultiplexing("enable-multiplexing", cl::desc("Enable CC multiplexing."), cl::init(false), cl::cat(lz4GrepFlags));
49
50static cl::OptionCategory lz4GrepDebugFlags("LZ4 Grep Debug Flags", "lz4d debug options");
51static cl::opt<bool> aio("aio", cl::desc("Use All-in-One Approach for LZ4 Decompression"), cl::init(false), cl::cat(lz4GrepDebugFlags));
52static cl::opt<bool> parallelDecompression("parallel-decompression", cl::desc("Use parallel Approach for LZ4 Decompression"), cl::init(false), cl::cat(lz4GrepDebugFlags));
53static cl::opt<bool> swizzledDecompression("swizzled-decompression", cl::desc("Use swizzle approach for decompression"), cl::init(false), cl::cat(lz4GrepDebugFlags));
54static cl::opt<bool> enableGather("enable-gather", cl::desc("Enable gather intrinsics"), cl::init(false), cl::cat(lz4GrepDebugFlags));
55static cl::opt<bool> enableScatter("enable-scatter", cl::desc("Enable scatter intrinsics"), cl::init(false), cl::cat(lz4GrepDebugFlags));
56
57
58int main(int argc, char *argv[]) {
59    // This boilerplate provides convenient stack traces and clean LLVM exit
60    // handling. It also initializes the built in support for convenient
61    // command line option handling.
62    sys::PrintStackTraceOnErrorSignal(argv[0]);
63    llvm::PrettyStackTraceProgram X(argc, argv);
64    llvm_shutdown_obj shutdown;
65    codegen::ParseCommandLineOptions(argc, argv, {&lz4GrepFlags, &lz4GrepDebugFlags, codegen::codegen_flags()});
66    std::string fileName = inputFile;
67    LZ4FrameDecoder lz4Frame(fileName);
68    if (!lz4Frame.isValid()) {
69        errs() << "Invalid LZ4 file.\n";
70        return -1;
71    }
72
73    boost::iostreams::mapped_file_source mappedFile;
74    // Since mmap offset has to be multiples of pages, we can't use it to skip headers.
75    mappedFile.open(fileName , lz4Frame.getBlocksLength() + lz4Frame.getBlocksStart());
76    //char *fileBuffer = const_cast<char *>(mappedFile.data()) + lz4Frame.getBlocksStart();
77    char *fileBuffer = const_cast<char *>(mappedFile.data());
78    re::RE * re_ast = re::RE_Parser::parse(regexString, re::MULTILINE_MODE_FLAG);
79    LZ4GrepGenerator g(enableMultiplexing);
80    if (aio) {
81        if (parallelDecompression) {
82            g.generateParallelAioPipeline(re_ast, enableGather, enableScatter);
83        } else if (enableMultiplexing) {
84            g.generateMultiplexingSwizzledAioPipeline2(re_ast);
85        } else if (swizzledDecompression) {
86            g.generateSwizzledAioPipeline(re_ast);
87        } else {
88            g.generateAioPipeline(re_ast);
89        }
90
91        auto main = g.getCountOnlyGrepMainFunction();
92        uint64_t countResult = main(fileBuffer, lz4Frame.getBlocksStart(), lz4Frame.getBlocksStart() + lz4Frame.getBlocksLength(), lz4Frame.hasBlockChecksum());
93        llvm::outs() << countResult << "\n";
94    } else if (countOnly) {
95        if (swizzledDecompression) {
96            g.generateSwizzledCountOnlyGrepPipeline(re_ast);
97        } else {
98            g.generateCountOnlyGrepPipeline(re_ast, enableGather);
99        }
100
101        auto main = g.getCountOnlyGrepMainFunction();
102        uint64_t countResult = main(fileBuffer, lz4Frame.getBlocksStart(), lz4Frame.getBlocksStart() + lz4Frame.getBlocksLength(), lz4Frame.hasBlockChecksum());
103        llvm::outs() << countResult << "\n";
104    } else {
105        g.generateScanMatchGrepPipeline(re_ast);
106        g.invokeScanMatchGrep(fileBuffer, lz4Frame.getBlocksStart(), lz4Frame.getBlocksStart() + lz4Frame.getBlocksLength(), lz4Frame.hasBlockChecksum());
107
108    }
109
110
111    mappedFile.close();
112    return 0;
113}
Note: See TracBrowser for help on using the repository browser.