versioninfo()

Julia Version 1.10.2
Commit bd47eca2c8a (2024-03-01 10:14 UTC)
Build Info:
  Official https://julialang.org/ release
Platform Info:
  OS: Linux (x86_64-linux-gnu)
  CPU: 32 × Intel(R) Xeon(R) CPU E5-2630 v3 @ 2.40GHz
  WORD_SIZE: 64
  LIBM: libopenlibm
  LLVM: libLLVM-15.0.7 (ORCJIT, haswell)
Threads: 1 default, 0 interactive, 1 GC (on 32 virtual cores)
Environment:
  JULIA_PKG_SERVER = https://mirrors.tuna.tsinghua.edu.cn/julia

# Set the output format of the GR backend to PNG. The default, SVG, disappears from Jupyter pages (after restart).
# StatsPlots has an identical gr() function.
@time using Plots;
#gr(fmt = "png")
@time gr(fmt = :png)

@time using StatsPlots; 
@time gr(fmt = :png)

  2.011342 seconds (1.31 M allocations: 81.792 MiB, 0.95% gc time, 10.53% compilation time: 89% of which was recompilation)
  0.000050 seconds (5 allocations: 576 bytes)
  1.449801 seconds (771.83 k allocations: 39.546 MiB, 8.81% gc time, 1.66% compilation time: 100% of which was recompilation)
  0.000038 seconds (5 allocations: 576 bytes)

Plots.GRBackend()

# Compare the density reported by two forms of the same distribution:
# Beta(1, 1) evaluated at 0 and Dirichlet([1, 1]) evaluated at [0, 1].
using Distributions;
beta = Beta(1, 1);
# Density of the Beta form at 0.
@show pdf(beta, 0);
dirichlet = Dirichlet([1, 1]);
# Density of the Dirichlet form at [0, 1].
@show pdf(dirichlet, [0, 1]);

pdf(beta, 0) = 1.0
pdf(dirichlet, [0, 1]) = 1.0

# Test the densities at impossible values: a negative coordinate (-0.5) for both
# distributions, and the point [1, 1], whose coordinates sum to 2, for a
# Dirichlet([1000, 100]). `@time` additionally reports the cost of each call.
@show @time pdf(beta, -0.5);
@show @time pdf(dirichlet, [-0.5, 1.5]);
@show @time pdf(Dirichlet([1000, 100]), [1, 1]);

  0.004283 seconds (1.25 k allocations: 88.367 KiB, 98.91% compilation time)
#= In[13]:2 =# @time(pdf(beta, -0.5)) = 0.0
  0.088154 seconds (138.02 k allocations: 9.336 MiB, 99.95% compilation time)
#= In[13]:3 =# @time(pdf(dirichlet, [-0.5, 1.5])) = 0.0
  0.000004 seconds (2 allocations: 160 bytes)
#= In[13]:4 =# @time(pdf(Dirichlet([1000, 100]), [1, 1])) = 0.0

using StatsBase;
using Pkg;
Pkg.status("StatsBase")

Status `~/.julia/environments/v1.10/Project.toml`
⌅ [2913bbd2] StatsBase v0.33.21
Info Packages marked with ⌅ have new versions available but compatibility constraints restrict them from upgrading. To see why use `status --outdated`

# Over 10^5 trials, tally the values returned by fisher_yates_sample! when the
# same array is passed as both of its array arguments.
let tally = zeros(5)
    for _ in 1:10^5
        pool = [1, 2, 3, 4, 5]
        # both arguments are the very same array
        drawn = StatsBase.fisher_yates_sample!(pool, pool)
        for v in drawn
            tally[v] += 1
        end
    end
    tally
end

5-element Vector{Float64}:
  20165.0
  65422.0
 104112.0
 138967.0
 171334.0

# Over 10^5 trials, tally the values returned by sample! without replacement when
# the first array argument is a fresh copy, so the two arrays do not share memory.
let tally = zeros(5)
    for _ in 1:10^5
        pool = [1, 2, 3, 4, 5]
        drawn = StatsBase.sample!(copy(pool), pool, replace=false)
        for v in drawn
            tally[v] += 1
        end
    end
    tally
end

5-element Vector{Float64}:
 100000.0
 100000.0
 100000.0
 100000.0
 100000.0

# Passing the same array as both array arguments of sample! (without replacement)
# now throws an error instead of returning a sample.
let tally = zeros(5)
    for _ in 1:10^5
        pool = [1, 2, 3, 4, 5]
        # both arguments are the very same array
        drawn = StatsBase.sample!(pool, pool, replace=false)
        for v in drawn
            tally[v] += 1
        end
    end
    tally
end

ArgumentError: output array a must not share memory with input array x

Stacktrace:
 [1] sample!(rng::Random._GLOBAL_RNG, a::Vector{Int64}, x::Vector{Int64}; replace::Bool, ordered::Bool)
   @ StatsBase ~/.julia/packages/StatsBase/XgjIN/src/sampling.jl:454
 [2] sample!
   @ ~/.julia/packages/StatsBase/XgjIN/src/sampling.jl:452 [inlined]
 [3] sample!
   @ ~/.julia/packages/StatsBase/XgjIN/src/sampling.jl:492 [inlined]
 [4] top-level scope
   @ ./In[24]:6

# Over 10^5 trials, tally the values returned by sample! with replacement when
# the first array argument is a fresh copy, so the two arrays do not share memory.
let tally = zeros(5)
    for _ in 1:10^5
        pool = [1, 2, 3, 4, 5]
        drawn = StatsBase.sample!(copy(pool), pool, replace=true)
        for v in drawn
            tally[v] += 1
        end
    end
    tally
end

5-element Vector{Float64}:
 100410.0
  99820.0
  99692.0
 100046.0
 100032.0

# sample! with replacement throws an error when both array arguments share memory.
let tally = zeros(5)
    for _ in 1:10^5
        pool = [1, 2, 3, 4, 5]
        # both arguments are the very same array
        drawn = StatsBase.sample!(pool, pool, replace=true)
        for v in drawn
            tally[v] += 1
        end
    end
    tally
end

ArgumentError: output array a must not share memory with input array x

Stacktrace:
 [1] sample!(rng::Random._GLOBAL_RNG, a::Vector{Int64}, x::Vector{Int64}; replace::Bool, ordered::Bool)
   @ StatsBase ~/.julia/packages/StatsBase/XgjIN/src/sampling.jl:454
 [2] sample!
   @ ~/.julia/packages/StatsBase/XgjIN/src/sampling.jl:452 [inlined]
 [3] sample!
   @ ~/.julia/packages/StatsBase/XgjIN/src/sampling.jl:492 [inlined]
 [4] top-level scope
   @ ./In[18]:5

# Over 10^5 trials, tally the values returned by ordered sample! with replacement
# when the first array argument is a fresh copy (no shared memory).
let tally = zeros(5)
    for _ in 1:10^5
        pool = [1, 2, 3, 4, 5]
        drawn = StatsBase.sample!(copy(pool), pool, ordered=true, replace=true)
        for v in drawn
            tally[v] += 1
        end
    end
    tally
end

5-element Vector{Float64}:
 100393.0
 100376.0
  99589.0
  99688.0
  99954.0

# Same ordered, with-replacement sample! call, but with one array passed as both
# array arguments.
let tally = zeros(5)
    for _ in 1:10^5
        pool = [1, 2, 3, 4, 5]
        # both arguments are the very same array
        drawn = StatsBase.sample!(pool, pool, ordered=true, replace=true)
        for v in drawn
            tally[v] += 1
        end
    end
    tally
end

ArgumentError: output array a must not share memory with input array x

Stacktrace:
 [1] sample!(rng::Random._GLOBAL_RNG, a::Vector{Int64}, x::Vector{Int64}; replace::Bool, ordered::Bool)
   @ StatsBase ~/.julia/packages/StatsBase/XgjIN/src/sampling.jl:454
 [2] sample!
   @ ~/.julia/packages/StatsBase/XgjIN/src/sampling.jl:452 [inlined]
 [3] sample!
   @ ~/.julia/packages/StatsBase/XgjIN/src/sampling.jl:492 [inlined]
 [4] top-level scope
   @ ./In[20]:5

# Time the product of two Int8 values stored in a Vector. The recorded result
# (10000) lies outside the Int8 range.
@time prod([Int8(100), Int8(100)])

  0.000003 seconds (1 allocation: 64 bytes)

10000

# Same product, but over a Tuple instead of a Vector; the recorded result is again 10000.
@time prod((Int8(100), Int8(100)))

  0.000000 seconds

10000

using StatsBase

# Fit a histogram to 1000 identical integer observations (all equal to 1).
fit(Histogram, fill(1, 1000))

Histogram{Int64, 1, Tuple{StepRangeLen{Float64, Base.TwicePrecision{Float64}, Base.TwicePrecision{Float64}, Int64}}}
edges:
  1.0:1.0:2.0
weights: [1000]
closed: left
isdensity: false

# Fit a histogram to 1000 identical Float64 observations (all equal to 1.234).
fit(Histogram, fill(1.234, 1000))

Histogram{Int64, 1, Tuple{StepRangeLen{Float64, Base.TwicePrecision{Float64}, Base.TwicePrecision{Float64}, Int64}}}
edges:
  1.234:1.0:2.234
weights: [1000]
closed: left
isdensity: false

# One more test: fit a histogram to the 100 values produced by rand(100).
fit(Histogram, rand(100))

Histogram{Int64, 1, Tuple{StepRangeLen{Float64, Base.TwicePrecision{Float64}, Base.TwicePrecision{Float64}, Int64}}}
edges:
  0.0:0.2:1.0
weights: [15, 19, 18, 25, 23]
closed: left
isdensity: false

sum!(R::AbstractArray, A::AbstractArray,
      w::AbstractWeights{<:Real}, dim::Int;
      init::Bool=true)

# Each stanza calls an in-place reduction on the 1×3 matrix `a`, writing either into a
# copy of `a` or into `a` itself, and (where printed) shows `a` afterwards.

# sum! into a copy.
a = [1 2 3];
@show sum!(copy(a), a)
println("a=", a)

# sum! with `a` as both destination and source (`a` is not reassigned before this call).
@show sum!(a, a)
println("a=", a)

# Aliased sum! again, this time with init=false.
a = [1 2 3];
@show sum!(a, a, init=false)

# prod! into a copy.
a = [1 2 3];
@show prod!(copy(a), a)
println("a=", a)

# prod! with `a` as both destination and source.
a = [1 2 3];
@show prod!(a, a)
println("a=", a)

# Aliased prod! with init=false.
a = [1 2 3];
@show prod!(a, a, init=false)
println("a=", a)

sum!(copy(a), a) = [1 2 3]
a=[1 2 3]
sum!(a, a) = [0 0 0]
a=[0 0 0]
sum!(a, a, init = false) = [2 4 6]
prod!(copy(a), a) = [1 2 3]
a=[1 2 3]
prod!(a, a) = [1 1 1]
a=[1 1 1]
prod!(a, a, init = false) = [1 4 9]
a=[1 4 9]

# cumsum!() returns the correct result even when the destination and the source
# are the same array.
a = [1, 2, 3];
@show cumsum!(a, a)
println("a=",a)

cumsum!(a, a) = [1, 3, 6]
a=[1, 3, 6]

# any! with the same array passed as both destination and source.
let flags = [true, false]
    any!(flags, flags)
end

2-element Vector{Bool}:
 0
 0

# any! writing into a separate copy of the source array.
let flags = [true, false]
    dest = copy(flags)
    any!(dest, flags)
end

2-element Vector{Bool}:
 1
 0

# all! with the same array passed as both destination and source.
let flags = [true, false]
    all!(flags, flags)
end

2-element Vector{Bool}:
 1
 1

# all! writing into a separate copy of the source array.
let flags = [true, false]
    dest = copy(flags)
    all!(dest, flags)
end

2-element Vector{Bool}:
 1
 0

G = [49, 14, 11, 6, 2, 1, 3, 2, 1, 3, 0, 1, 2, 2, 1, 0, 1, 1, 1, 0, 2, 1, 1, 2, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 
0, 0, 0, 0, 0, 0, 0, 1]
# Number of entries in G; also the largest threshold tabulated below.
ΔG = length(G)
# Map every threshold i in 1:ΔG to the number of entries of G that are at least i.
degG = Dict(i => count(≥(i), G) for i in 1:ΔG);
# Key-sorted counterpart of degG. NOTE(review): presumably an OrderedDict, since
# sorting a Dict is not provided by Base — confirm which loaded package supplies it.
degG′ = sort(degG);

# Look up key 626 in the unsorted dictionary.
degG[626]

0

# Look up the same key in the sorted dictionary; it should agree with degG[626].
degG′[626]

0

# Check that 626 is reported as a key of the sorted dictionary in two ways:
# directly against keys(degG′), and against those keys collected into an array.
@show 626 ∈ keys(degG′)
@show 626 ∈ collect(keys(degG′))

626 ∈ keys(degG′) = true
626 ∈ collect(keys(degG′)) = true

true

1 Incorrect probability density from different forms of the same distribution: Beta(1,1) vs Dirichlet([1,1])

2 Sampling is biased when the destination array is equal to the sampled array.

3 The product function can produce incorrect results for 8-bit, 16-bit, and 32-bit integers

4 Incorrect Histogram fit for arrays of equal Float64 values

5 sum!, prod!, any!, and all! may silently return incorrect results #39385

7 OrderedDict corrupted keys