Another one line, this time with numpy.where:
out = {v: np.where(v == a)[0] for v in numpy.unique(a)}
(For some applications, a logical array is sufficient:
out = {v: v == a for v in numpy.unique(a)}
)
Please note that it is numpy.uniquefaster than set()for large arrays, and a large margin if there are only a few unique entries.
Anyway, for most array sizes, this is the fastest way:
10 different integers:

100 :

:
import numpy as np
from collections import defaultdict
import perfplot
def pp(a):
index = np.argsort(a, kind='mergesort')
as_ = a[index]
jumps = np.r_[0, 1 + np.where(np.diff(as_) != 0)[0]]
pp_out = {k: v for k, v in zip(as_[jumps], np.split(index, jumps[1:]))}
return pp_out
def pp2(a):
index = np.argsort(a)
as_ = a[index]
jumps = np.r_[0, 1 + np.where(np.diff(as_) != 0)[0]]
pp_out = {k: np.sort(v)
for k, v in zip(as_[jumps], np.split(index, jumps[1:]))}
return pp_out
def Denziloe_JFFabre(a):
df_out = {v: [i for i, x in enumerate(a) if x == v] for v in np.unique(a)}
return df_out
def FCouzo(a):
fc_out = defaultdict(list)
for i, elem in enumerate(a):
fc_out[elem].append(i)
return fc_out
def KKSingh(a):
kks_out = defaultdict(list)
list(map(lambda x: kks_out[x[0]].append(x[1]), zip(a, range(len(a)))))
return kks_out
def TMcDonaldJensen(a):
mdj_out = defaultdict(list)
for i, elem in enumerate(a):
mdj_out[elem].append(i)
return mdj_out
def RomanPerekhrest(a):
rp_out = {}
for k, m in enumerate(a):
rp_out.setdefault(m, []).append(k)
return rp_out
def SchloemerHist(a):
np.histogram(a, bins=np.arange(min(a), max(a)+2))
return
def SchloemerWhere(a):
out = {v: np.where(v == a)[0] for v in np.unique(a)}
return out
def SchloemerBooleanOnly(a):
out = {v: v == a for v in np.unique(a)}
return out
perfplot.show(
setup=lambda n: np.random.randint(0, 100, n),
kernels=[
pp, pp2, Denziloe_JFFabre, FCouzo, KKSingh,
TMcDonaldJensen, RomanPerekhrest, SchloemerHist, SchloemerWhere,
SchloemerBooleanOnly
],
n_range=[2**k for k in range(17)],
xlabel='len(a)',
logx=True,
logy=True,
)