summaryrefslogtreecommitdiff
path: root/Userland/Utilities/sort.cpp
blob: 02c28a4e557b743189edfb0c4f54e7fea913b85c (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
/*
 * Copyright (c) 2018-2020, Andreas Kling <kling@serenityos.org>
 * Copyright (c) 2022, Peter Elliott <pelliott@serenityos.org>
 *
 * SPDX-License-Identifier: BSD-2-Clause
 */

#include <AK/DeprecatedString.h>
#include <AK/HashMap.h>
#include <AK/QuickSort.h>
#include <AK/Vector.h>
#include <LibCore/ArgsParser.h>
#include <LibCore/File.h>
#include <LibCore/System.h>
#include <LibMain/Main.h>
#include <ctype.h>

// A single input line paired with the key it is compared by.
// Field order matters: instances are built with positional aggregate initialization.
struct Line {
    // Textual key; compared when `numeric` is false.
    StringView key;
    // Integer key; compared when `numeric` is true.
    long int numeric_key;
    // The line's text; this is what gets written to the output.
    DeprecatedString line;
    // Chooses between the numeric and the textual key for ordering and equality.
    bool numeric;

    // Orders by `numeric_key` when this line is numeric, otherwise by `key`.
    bool operator<(Line const& rhs) const
    {
        return numeric ? (numeric_key < rhs.numeric_key) : (key < rhs.key);
    }

    // Two lines are equal when the key selected by `numeric` matches.
    bool operator==(Line const& rhs) const
    {
        return numeric ? (numeric_key == rhs.numeric_key) : (key == rhs.key);
    }
};

// Hash traits for Line. The hash is derived from the same field that
// Line::operator== compares: the numeric key for numeric lines, the
// textual key otherwise.
template<>
struct AK::Traits<Line> : public GenericTraits<Line> {
    // Takes the Line by const reference so that hashing does not copy the
    // whole struct (including its DeprecatedString) on every call.
    static unsigned hash(Line const& l)
    {
        // The long -> unsigned conversion intentionally keeps only the low bits.
        if (l.numeric)
            return static_cast<unsigned>(l.numeric_key);

        return l.key.hash();
    }
};

// Command-line settings for the sort utility.
struct Options {
    // 1-based index of the field used as the sort key; 0 uses the whole line.
    size_t key_field = 0;
    // When set, lines whose key has already been seen are dropped.
    bool unique = false;
    // When set, lines are compared by the integer value of their key.
    bool numeric = false;
    // Field separator; only its first byte is used. A leading NUL byte
    // (the default) selects splitting on whitespace.
    StringView separator { "\0", 1 };
    // Input files; when empty, "-" is loaded instead.
    Vector<DeprecatedString> files;
};

// Reads `filename` line by line and appends one Line per kept input line to `lines`.
//
// The sort key is the whole line when options.key_field is 0. Otherwise the line
// is split into fields and the key is the key_field-th field (1-based); a line
// with too few fields gets an empty key. With options.unique set, a line whose
// key is already present in `seen` is skipped, and every kept line is recorded
// in `seen`.
//
// Errors from opening or reading the file are propagated to the caller.
static ErrorOr<void> load_file(Options const& options, StringView filename, Vector<Line>& lines, HashTable<Line>& seen)
{
    auto file = TRY(Core::BufferedFile::create(
        TRY(Core::File::open_file_or_standard_stream(filename, Core::File::OpenMode::Read))));

    // Both an empty separator (e.g. `-t ''`) and the default NUL separator mean
    // "split on whitespace". Testing for emptiness first avoids indexing past the
    // end of an empty StringView.
    bool const split_on_whitespace = options.separator.is_empty() || options.separator[0] == '\0';

    // FIXME: Unlimited line length
    auto buffer = TRY(ByteBuffer::create_uninitialized(4096));
    while (TRY(file->can_read_line())) {
        DeprecatedString line = TRY(file->read_line(buffer));

        StringView key = line;
        if (options.key_field != 0) {
            // isspace() is only defined for arguments representable as unsigned char
            // (or EOF), so go through unsigned char rather than a possibly negative char.
            auto fields = split_on_whitespace
                ? line.split_view([](char ch) { return isspace(static_cast<unsigned char>(ch)) != 0; })
                : line.split_view(options.separator[0]);

            size_t const field_index = options.key_field - 1;
            if (field_index < fields.size())
                key = fields[field_index];
            else
                key = ""sv;
        }

        // Keys that do not parse as an integer get a numeric key of 0.
        Line l = { key, key.to_int().value_or(0), line, options.numeric };

        if (options.unique) {
            if (seen.contains(l))
                continue;
            seen.set(l);
        }
        lines.append(l);
    }

    return {};
}

// Entry point: parses the command-line options, loads every input file
// (or "-" when no file is given), sorts the collected lines and prints them.
ErrorOr<int> serenity_main([[maybe_unused]] Main::Arguments arguments)
{
    TRY(Core::System::pledge("stdio rpath"));

    Options options;

    Core::ArgsParser args_parser;
    args_parser.add_option(options.key_field, "The field to sort by", "key-field", 'k', "keydef");
    args_parser.add_option(options.unique, "Don't emit duplicate lines", "unique", 'u');
    args_parser.add_option(options.numeric, "treat the key field as a number", "numeric", 'n');
    args_parser.add_option(options.separator, "The separator to split fields by", "sep", 't', "char");
    args_parser.add_positional_argument(options.files, "Files to sort", "file", Core::ArgsParser::Required::No);
    args_parser.parse(arguments);

    Vector<Line> lines;
    HashTable<Line> seen;

    // `lines` and `seen` are shared across all inputs, so the files are
    // sorted (and de-duplicated) together rather than one by one.
    if (!options.files.is_empty()) {
        for (auto const& path : options.files)
            TRY(load_file(options, path, lines, seen));
    } else {
        // No files given: load "-" instead.
        TRY(load_file(options, "-"sv, lines, seen));
    }

    quick_sort(lines);

    for (auto const& entry : lines)
        outln("{}", entry.line);

    return 0;
}