|
|
|
|
@@ -3,8 +3,9 @@ module util
|
|
|
|
|
export timedifference, showstracktrace, findHighestIndexKey, uuid4snakecase, replaceDictKeys,
|
|
|
|
|
findMatchingDictKey, textToDict, randstring, randstrings, timeout,
|
|
|
|
|
dataframeToCSV, dfToVectorDict, disintegrate_vectorDict, getDataFrameValue, dfRowtoString,
|
|
|
|
|
dfToString, dataframe_to_json_list, dict_to_string, extract_triple_backtick_text,
|
|
|
|
|
countGivenWords, remove_french_accents, detect_keyword
|
|
|
|
|
dfToString, dataframe_to_json_list, dictToString, dictToString_noKey,
|
|
|
|
|
dictToString_numbering, extract_triple_backtick_text,
|
|
|
|
|
countGivenWords, remove_french_accents, detect_keyword, extractTextBetweenCharacter
|
|
|
|
|
|
|
|
|
|
using JSON3, DataStructures, Distributions, Random, Dates, UUIDs, MQTTClient, DataFrames
|
|
|
|
|
|
|
|
|
|
@@ -479,7 +480,7 @@ end
|
|
|
|
|
function dfToVectorDict(df::DataFrame)
|
|
|
|
|
vec = []
|
|
|
|
|
for row in eachrow(df)
|
|
|
|
|
d = Dict{String, Any}()
|
|
|
|
|
d = DataStructures.OrderedDict{String, Any}()
|
|
|
|
|
for col in names(df)
|
|
|
|
|
d[col] = row[col]
|
|
|
|
|
end
|
|
|
|
|
@@ -709,7 +710,15 @@ end
|
|
|
|
|
|
|
|
|
|
# Signature
|
|
|
|
|
"""
|
|
|
|
|
function dict_to_string(od::T) where {T<:AbstractDict}
|
|
|
|
|
function dictToString(od::T) where {T<:AbstractDict}
    # Render every entry of `od` as "key: value" and join the entries with ", ".
    # Entries appear in the dictionary's own iteration order; an empty
    # dictionary yields "".
    # A lazy generator feeds `join` directly, so no untyped intermediate vector
    # is built and no unused loop counter is carried around.
    return join(("$key: $value" for (key, value) in od), ", ")
end
|
|
|
|
|
|
|
|
|
|
function dictToString_numbering(od::T) where {T<:AbstractDict}
|
|
|
|
|
items = []
|
|
|
|
|
for (i, (key, value)) in enumerate(od)
|
|
|
|
|
push!(items, "$i) $key: $value")
|
|
|
|
|
@@ -717,6 +726,14 @@ function dict_to_string(od::T) where {T<:AbstractDict}
|
|
|
|
|
return join(items, ", ")
|
|
|
|
|
end
|
|
|
|
|
|
|
|
|
|
"""
    dictToString_noKey(od::AbstractDict) -> String

Join the values of `od` into a single string separated by `", "`, omitting the keys.

Values appear in the dictionary's own iteration order and are rendered the same way
string interpolation would render them. An empty dictionary yields `""`.
"""
function dictToString_noKey(od::T) where {T<:AbstractDict}
    # `join` prints each value exactly like "$value" would, so the values can be
    # handed over directly without an intermediate vector or an unused index/key.
    return join(values(od), ", ")
end
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
"""
|
|
|
|
|
extract_triple_backtick_text(text::String) -> Vector{String}
|
|
|
|
|
@@ -730,7 +747,7 @@ Extracts text enclosed within triple backticks (```) from the given string.
|
|
|
|
|
- `Vector{String}`: A vector of strings, each representing a block of text enclosed within triple backticks found in the input string.
|
|
|
|
|
|
|
|
|
|
# Examples:
|
|
|
|
|
```julia
|
|
|
|
|
```jldoctest
|
|
|
|
|
julia> extract_triple_backtick_text("Here is some text ```with a code block``` and more text.")
|
|
|
|
|
1-element Vector{String}:
|
|
|
|
|
"with a code block"
|
|
|
|
|
@@ -762,7 +779,7 @@ Detects if a keyword exists in the text in different case variations (lowercase,
|
|
|
|
|
- `Union{Nothing, String}`: Returns the matched keyword variation if found, otherwise returns nothing
|
|
|
|
|
|
|
|
|
|
# Examples:
|
|
|
|
|
```julia
|
|
|
|
|
```jldoctest
|
|
|
|
|
julia> detect_keyword("test", "This is a Test case")
|
|
|
|
|
"Test"
|
|
|
|
|
|
|
|
|
|
@@ -804,7 +821,7 @@ Count the occurrences of each word in the given list within the provided text.
|
|
|
|
|
- `Vector{Int64}`: Their respective counts in the `text`.
|
|
|
|
|
|
|
|
|
|
# Examples
|
|
|
|
|
```julia
|
|
|
|
|
```jldoctest
|
|
|
|
|
julia> GeneralUtils.countGivenWords("hello world hello", ["hello", "world"])
|
|
|
|
|
2-element Vector{Int64}:
|
|
|
|
|
2
|
|
|
|
|
@@ -846,7 +863,7 @@ Remove French accents from the given text.
|
|
|
|
|
- `String`: The input string with all French accents removed.
|
|
|
|
|
|
|
|
|
|
# Examples
|
|
|
|
|
```julia
|
|
|
|
|
```jldoctest
|
|
|
|
|
julia> remove_french_accents("Café")
|
|
|
|
|
"Cafe"
|
|
|
|
|
|
|
|
|
|
@@ -890,6 +907,44 @@ function remove_french_accents(text::AbstractString)::AbstractString
|
|
|
|
|
end
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
"""
|
|
|
|
|
    extractTextBetweenCharacter(text::String, startchar::Char, endchar::Char) -> Vector

Extract every substring of `text` that is enclosed between `startchar` and `endchar`.

# Arguments:
- `text::String`: The input string from which to extract the text.
- `startchar::Char`: The character that marks the beginning of an enclosed segment.
- `endchar::Char`: The character that marks the end of an enclosed segment.

# Returns:
- `Vector`: The enclosed substrings, in order of appearance and without the delimiters. The vector is empty when `text` contains no complete `startchar` ... `endchar` pair.

# Examples:
```jldoctest
julia> text = "Hello [World]!";

julia> extractTextBetweenCharacter(text, '[', ']')
1-element Vector{Any}:
 "World"
```
|
|
|
|
|
"""
|
|
|
|
|
function extractTextBetweenCharacter(text::String, startchar::Char, endchar::Char)
    # Collect every segment of `text` that lies between a `startchar` and the next
    # `endchar`, delimiters excluded, in order of appearance.
    #
    # - A further `startchar` seen before the closing `endchar` restarts the
    #   segment, so only the text after the most recent `startchar` is captured.
    # - An `endchar` without a pending `startchar` is ignored, as is a `startchar`
    #   that is never closed.
    # - When `startchar == endchar` the first branch always wins, so nothing is
    #   ever captured.
    #
    # The accumulator is deliberately left untyped so the returned vector keeps
    # the same type callers have received so far.
    result = []
    start_index = 0
    in_braces = false

    # `pairs` yields valid *byte* indices. Counting characters with `enumerate`
    # and then slicing with those counts breaks as soon as `text` contains a
    # multi-byte (non-ASCII) character.
    for (i, c) in pairs(text)
        if c == startchar
            # First index after the delimiter, whatever its encoded width.
            start_index = nextind(text, i)
            in_braces = true
        elseif c == endchar && in_braces
            # Last index before the closing delimiter; yields "" for an empty pair.
            push!(result, text[start_index:prevind(text, i)])
            in_braces = false
        end
    end

    return result
end
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|