deedrop1140's picture
Upload 41 files
0d00d62 verified
{
"title": "DBSCAN Mastery: 100 MCQs",
"description": "A comprehensive set of 100 multiple-choice questions designed to test and deepen your understanding of DBSCAN (Density-Based Spatial Clustering of Applications with Noise), covering fundamental concepts, parameters, advantages, limitations, and practical scenarios.",
"questions": [
{
"id": 1,
"questionText": "What is the main idea behind DBSCAN clustering?",
"options": [
"Clusters are dense regions separated by sparse regions",
"All points are assigned to a cluster",
"Clusters are linearly separable",
"Clusters are formed by equal-sized groups"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN identifies clusters based on density: areas with many points form clusters, and sparse regions separate them."
},
{
"id": 2,
"questionText": "DBSCAN requires which key parameters?",
"options": [
"Number of clusters (k) only",
"Learning rate and iterations",
"Distance metric only",
"Epsilon (eps) and Minimum points (minPts)"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN uses eps (neighborhood radius) and minPts (minimum points to form a dense region) to define clusters."
},
{
"id": 3,
"questionText": "In DBSCAN, what is a 'core point'?",
"options": [
"Point on the boundary of clusters",
"Point with no neighbors",
"Point with at least minPts neighbors within eps",
"Any point in the dataset"
],
"correctAnswerIndex": 2,
"explanation": "A core point has enough neighboring points within eps to be considered part of a dense cluster."
},
{
"id": 4,
"questionText": "In DBSCAN, what is a 'border point'?",
"options": [
"Point not in any cluster",
"Point reachable from a core point but with fewer than minPts neighbors",
"Point with more than minPts neighbors",
"Centroid of a cluster"
],
"correctAnswerIndex": 1,
"explanation": "Border points are density-reachable from core points but do not have enough neighbors themselves to be core points."
},
{
"id": 5,
"questionText": "In DBSCAN, what is a 'noise point'?",
"options": [
"Point with maximum density",
"Point on the cluster centroid",
"Point with exactly minPts neighbors",
"Point not reachable from any core point"
],
"correctAnswerIndex": 3,
"explanation": "Noise points are isolated points that do not belong to any cluster."
},
{
"id": 6,
"questionText": "Scenario: You have clusters of varying density. Challenge for DBSCAN?",
"options": [
"DBSCAN fails to run",
"Always finds all clusters perfectly",
"Clusters become linearly separable",
"May merge dense clusters and miss sparse ones"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN struggles with clusters of differing densities because eps and minPts are global parameters."
},
{
"id": 7,
"questionText": "Scenario: Choosing eps too large. Effect?",
"options": [
"Algorithm fails",
"Noise increases",
"More clusters detected",
"Clusters may merge; noise reduced"
],
"correctAnswerIndex": 3,
"explanation": "Large eps connects distant points, possibly merging distinct clusters."
},
{
"id": 8,
"questionText": "Scenario: Choosing eps too small. Effect?",
"options": [
"Clusters merge",
"Many points labeled as noise; clusters fragmented",
"No effect",
"EM applied instead"
],
"correctAnswerIndex": 1,
"explanation": "Small eps results in fewer neighbors; many points cannot form clusters and are marked as noise."
},
{
"id": 9,
"questionText": "Scenario: Setting minPts too high. Effect?",
"options": [
"Clusters merge",
"More points labeled as noise; small clusters ignored",
"Algorithm fails",
"Clusters increase"
],
"correctAnswerIndex": 1,
"explanation": "High minPts requires dense regions to form clusters, excluding smaller or sparse clusters."
},
{
"id": 10,
"questionText": "Scenario: Setting minPts too low. Effect?",
"options": [
"DBSCAN fails",
"Clusters disappear",
"Many small clusters; noise reduced",
"Clusters merge automatically"
],
"correctAnswerIndex": 2,
"explanation": "Low minPts allows small groups to form clusters, potentially splitting natural clusters."
},
{
"id": 11,
"questionText": "Scenario: A border point is connected to multiple core points of different clusters. How is it assigned?",
"options": [
"Becomes noise automatically",
"Forms a new cluster",
"Assigned to any one cluster arbitrarily or first reachable",
"Algorithm fails"
],
"correctAnswerIndex": 2,
"explanation": "Border points can belong to one cluster; usually assigned to the first core point that reaches it."
},
{
"id": 12,
"questionText": "Scenario: You have 2D spatial data with noise. DBSCAN advantage?",
"options": [
"Detects clusters of arbitrary shape and identifies noise",
"Requires clusters to be circular",
"Sensitive to number of clusters parameter",
"Assigns all points to clusters"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN works well for arbitrary shapes and identifies noise points."
},
{
"id": 13,
"questionText": "Scenario: Using Euclidean distance vs Manhattan distance in DBSCAN. Effect?",
"options": [
"Distance metric affects cluster shapes and eps choice",
"DBSCAN fails",
"No effect; clusters same",
"Noise ignored"
],
"correctAnswerIndex": 0,
"explanation": "Different distance metrics affect neighborhood calculation, which can change clustering."
},
{
"id": 14,
"questionText": "Scenario: DBSCAN applied on high-dimensional data. Challenge?",
"options": [
"Distance measures become less meaningful (curse of dimensionality)",
"Algorithm runs faster",
"Clusters automatically reduce",
"Noise decreases"
],
"correctAnswerIndex": 0,
"explanation": "High dimensions can make points appear equidistant, complicating density estimation."
},
{
"id": 15,
"questionText": "Scenario: You have concentric clusters. DBSCAN challenge?",
"options": [
"May fail to separate inner and outer clusters depending on eps",
"Always separates perfectly",
"Clusters merge automatically",
"Noise increases"
],
"correctAnswerIndex": 0,
"explanation": "Density difference between inner and outer rings may cause DBSCAN to merge or mislabel clusters."
},
{
"id": 16,
"questionText": "Scenario: Using DBSCAN for geospatial clustering. Advantage?",
"options": [
"Finds clusters of arbitrary shape like regions or neighborhoods",
"Clusters must be circular",
"All points assigned",
"Sensitive to number of clusters"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN can identify irregularly shaped spatial clusters without specifying cluster count."
},
{
"id": 17,
"questionText": "Scenario: You want clusters of varying density. DBSCAN limitation?",
"options": [
"Noise removed automatically",
"Single global eps may not detect all clusters",
"Algorithm adapts automatically",
"All clusters found"
],
"correctAnswerIndex": 1,
"explanation": "DBSCAN uses a fixed eps, which can miss sparse clusters or merge dense clusters."
},
{
"id": 18,
"questionText": "Scenario: You apply DBSCAN on streaming data. Challenge?",
"options": [
"Noise ignored",
"Automatically updates clusters",
"All points reassigned automatically",
"Standard DBSCAN is static; streaming adaptation required"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN is not incremental; modifications are needed for dynamic/streaming data."
},
{
"id": 19,
"questionText": "Scenario: Using DBSCAN for anomaly detection. Approach?",
"options": [
"Assign random labels",
"Label points not in any cluster as anomalies",
"Clusters merged manually",
"Use all clusters for prediction"
],
"correctAnswerIndex": 1,
"explanation": "Noise points are naturally flagged as outliers."
},
{
"id": 20,
"questionText": "Scenario: DBSCAN vs K-Means on arbitrary-shaped clusters. Advantage?",
"options": [
"DBSCAN fails for shapes",
"Both perform equally",
"K-Means better for arbitrary shapes",
"DBSCAN can capture non-spherical clusters; K-Means cannot"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN works with clusters of any shape without requiring centroids."
},
{
"id": 21,
"questionText": "Scenario: Two clusters are close together but separated by sparse points. DBSCAN outcome?",
"options": [
"Fails to converge",
"Marks everything as noise",
"Correctly separates clusters using density differences",
"Merges clusters automatically"
],
"correctAnswerIndex": 2,
"explanation": "Sparse points allow DBSCAN to distinguish dense clusters even if they are close."
},
{
"id": 22,
"questionText": "Scenario: Applying DBSCAN on 3D point cloud data. Advantage?",
"options": [
"Clusters must be spherical",
"All points assigned to clusters",
"Can find clusters of arbitrary 3D shape and ignore noise",
"Requires predefining cluster centers"
],
"correctAnswerIndex": 2,
"explanation": "DBSCAN handles multi-dimensional data and can identify irregular clusters and noise."
},
{
"id": 23,
"questionText": "Scenario: DBSCAN uses Manhattan distance on grid data. Effect?",
"options": [
"Algorithm fails",
"Noise increases automatically",
"Clusters align with grid; eps choice differs",
"No effect on clusters"
],
"correctAnswerIndex": 2,
"explanation": "Distance metric changes the neighborhood definition, affecting cluster formation."
},
{
"id": 24,
"questionText": "Scenario: You want small but dense clusters. How to set parameters?",
"options": [
"Small eps and appropriate minPts",
"Large eps",
"Ignore parameters",
"Large minPts"
],
"correctAnswerIndex": 0,
"explanation": "Smaller eps ensures that small dense regions form separate clusters."
},
{
"id": 25,
"questionText": "Scenario: You have noisy sensor data. DBSCAN benefit?",
"options": [
"Clusters all points",
"Fails with noise",
"Requires K-Means preprocessing",
"Automatically labels isolated points as noise"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN identifies low-density points as noise, avoiding misclassification."
},
{
"id": 26,
"questionText": "Scenario: Data with hierarchical cluster structure. Limitation of DBSCAN?",
"options": [
"Noise ignored",
"All clusters merged",
"Cannot detect hierarchy; only flat clusters",
"Automatically finds hierarchy"
],
"correctAnswerIndex": 2,
"explanation": "DBSCAN provides flat clustering; hierarchical relationships are not captured."
},
{
"id": 27,
"questionText": "Scenario: Using DBSCAN for image segmentation. Advantage?",
"options": [
"Requires predefined number of segments",
"All pixels assigned to clusters",
"Identifies irregular regions and isolates noise",
"Clusters must be circular"
],
"correctAnswerIndex": 2,
"explanation": "DBSCAN captures arbitrary-shaped regions and treats background/noisy pixels as noise."
},
{
"id": 28,
"questionText": "Scenario: You have clusters of different densities. How to adapt DBSCAN?",
"options": [
"Reduce dimensionality",
"Use varying eps with methods like HDBSCAN",
"Keep single global eps",
"Increase minPts"
],
"correctAnswerIndex": 1,
"explanation": "Standard DBSCAN struggles with varying densities; adaptive versions like HDBSCAN help."
},
{
"id": 29,
"questionText": "Scenario: DBSCAN fails to detect clusters in high-dimensional text embeddings. Solution?",
"options": [
"Increase minPts arbitrarily",
"Use full covariance",
"Reduce dimensions using PCA or t-SNE before clustering",
"Ignore scaling"
],
"correctAnswerIndex": 2,
"explanation": "Dimensionality reduction improves distance computation and density estimation."
},
{
"id": 30,
"questionText": "Scenario: Choosing minPts in DBSCAN. Rule of thumb?",
"options": [
"MinPts = 1 always",
"MinPts = dataset size",
"MinPts ignored",
"MinPts ≥ dimensionality + 1"
],
"correctAnswerIndex": 3,
"explanation": "MinPts should be slightly larger than the data dimensionality for meaningful clusters."
},
{
"id": 31,
"questionText": "Scenario: DBSCAN applied on GPS data of taxis in a city. Best use case?",
"options": [
"Assign random clusters",
"Identify high-density pickup/drop-off hotspots",
"Detect only circular areas",
"Cluster by taxi color"
],
"correctAnswerIndex": 1,
"explanation": "DBSCAN can detect dense regions where taxis frequently gather without assuming cluster shape."
},
{
"id": 32,
"questionText": "Scenario: You notice DBSCAN marks too many points as noise. Likely cause?",
"options": [
"Algorithm failed",
"All clusters are too dense",
"Distance metric wrong",
"eps too small or minPts too high"
],
"correctAnswerIndex": 3,
"explanation": "Small eps or high minPts can make points unable to form clusters, labeling them as noise."
},
{
"id": 33,
"questionText": "Scenario: DBSCAN applied to social network graph. Challenge?",
"options": [
"Clusters are always detected",
"DBSCAN works directly on graph",
"Noise ignored",
"Graph edges may not correspond to meaningful distances; need transformation"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN requires distance metrics; graphs need embedding or distance conversion."
},
{
"id": 34,
"questionText": "Scenario: Using DBSCAN for anomaly detection in network traffic. How?",
"options": [
"Label low-density patterns as anomalies",
"All high-traffic nodes flagged",
"Randomly assign anomalies",
"Clusters merged manually"
],
"correctAnswerIndex": 0,
"explanation": "Low-density points correspond to unusual patterns, suitable for anomaly detection."
},
{
"id": 35,
"questionText": "Scenario: High-dimensional DBSCAN performance issue. Solution?",
"options": [
"Use dimensionality reduction or HDBSCAN",
"Ignore distance metric",
"Use K-Means instead",
"Increase eps arbitrarily"
],
"correctAnswerIndex": 0,
"explanation": "Reducing dimensions or using hierarchical density clustering helps in high-dimensional spaces."
},
{
"id": 36,
"questionText": "Scenario: Clusters are elongated. DBSCAN vs K-Means?",
"options": [
"K-Means works better",
"All points assigned to noise",
"DBSCAN captures arbitrary shapes better",
"Both fail"
],
"correctAnswerIndex": 2,
"explanation": "DBSCAN does not assume spherical clusters, so elongated shapes are captured well."
},
{
"id": 37,
"questionText": "Scenario: DBSCAN fails on variable-density clusters. Solution?",
"options": [
"Reduce minPts to 1",
"Use HDBSCAN for adaptive density clustering",
"Increase eps globally",
"Ignore problem"
],
"correctAnswerIndex": 1,
"explanation": "HDBSCAN handles clusters with varying density better than standard DBSCAN."
},
{
"id": 38,
"questionText": "Scenario: You want reproducible DBSCAN results. Requirement?",
"options": [
"Ignore minPts",
"Deterministic neighbor search and consistent distance metric",
"Random initialization",
"Vary eps each run"
],
"correctAnswerIndex": 1,
"explanation": "Reproducibility requires deterministic calculations for neighborhoods and distances."
},
{
"id": 39,
"questionText": "Scenario: DBSCAN applied on time-series sensor readings. Approach?",
"options": [
"Use sliding windows to extract features before clustering",
"Clusters automatically detected",
"Apply DBSCAN on raw timestamps",
"Ignore feature extraction"
],
"correctAnswerIndex": 0,
"explanation": "Time-series features are extracted to represent temporal patterns for density-based clustering."
},
{
"id": 40,
"questionText": "Scenario: You need clusters and hierarchy. Limitation of DBSCAN?",
"options": [
"Noise ignored",
"DBSCAN provides only flat clustering",
"Automatically generates hierarchy",
"Clusters nested by default"
],
"correctAnswerIndex": 1,
"explanation": "DBSCAN produces flat clusters; hierarchical relationships require extensions like HDBSCAN."
},
{
"id": 41,
"questionText": "Scenario: DBSCAN applied on customer purchase patterns. Advantage?",
"options": [
"Requires predefined cluster number",
"Sensitive to initial seed",
"Detects dense buying behavior groups and isolates rare patterns",
"All points assigned"
],
"correctAnswerIndex": 2,
"explanation": "DBSCAN identifies dense purchasing patterns and separates anomalies naturally."
},
{
"id": 42,
"questionText": "Scenario: You want to tune DBSCAN eps parameter. Approach?",
"options": [
"MinPts adjustment only",
"Always choose maximum distance",
"Use k-distance graph to identify elbow point",
"Randomly guess eps"
],
"correctAnswerIndex": 2,
"explanation": "Plotting k-distance helps find a suitable eps where distances start increasing sharply."
},
{
"id": 43,
"questionText": "Scenario: DBSCAN with overlapping clusters. Effect?",
"options": [
"Points duplicated",
"Clusters fail completely",
"Overlap handled by density; border points assigned to one cluster",
"Noise ignored"
],
"correctAnswerIndex": 2,
"explanation": "DBSCAN assigns border points to a reachable cluster; soft assignment is not available."
},
{
"id": 44,
"questionText": "Scenario: Applying DBSCAN to text embeddings. Challenge?",
"options": [
"Noise ignored",
"All points assigned to clusters",
"DBSCAN always works",
"High-dimensional distances may be less meaningful"
],
"correctAnswerIndex": 3,
"explanation": "Distance measures in high dimensions can reduce effectiveness; dimensionality reduction helps."
},
{
"id": 45,
"questionText": "Scenario: Noise proportion is high. DBSCAN behavior?",
"options": [
"Many points labeled as noise; cluster detection limited",
"Algorithm fails",
"Clusters detected perfectly",
"All points assigned to clusters"
],
"correctAnswerIndex": 0,
"explanation": "High noise density can prevent formation of dense clusters."
},
{
"id": 46,
"questionText": "Scenario: DBSCAN on streaming data. Limitation?",
"options": [
"Standard DBSCAN is static; needs incremental adaptation",
"All points reassigned automatically",
"Noise ignored",
"Automatically updates clusters"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN is not inherently incremental; streaming data requires modified algorithms."
},
{
"id": 47,
"questionText": "Scenario: DBSCAN vs K-Means for non-spherical clusters. Advantage?",
"options": [
"Both fail",
"K-Means better",
"Noise ignored",
"DBSCAN detects arbitrary shapes; K-Means cannot"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN does not rely on centroid or spherical assumption."
},
{
"id": 48,
"questionText": "Scenario: You apply DBSCAN on noisy sensor readings. Outcome?",
"options": [
"Isolates isolated points as noise automatically",
"Clusters all points",
"Noise merged into clusters",
"Algorithm fails"
],
"correctAnswerIndex": 0,
"explanation": "Low-density or isolated points are correctly treated as noise."
},
{
"id": 49,
"questionText": "Scenario: Choosing distance metric affects DBSCAN. Why?",
"options": [
"All clusters merge",
"No effect",
"Neighborhood depends on distance; cluster shape affected",
"Noise ignored"
],
"correctAnswerIndex": 2,
"explanation": "Different metrics change neighbor counts, affecting core points and cluster formation."
},
{
"id": 50,
"questionText": "Scenario: DBSCAN on highly skewed 2D data. Challenge?",
"options": [
"Clusters detected automatically",
"Algorithm fails",
"Fixed eps may not capture sparse areas",
"Noise reduced"
],
"correctAnswerIndex": 2,
"explanation": "Single eps cannot adapt to varying densities; sparse regions may be misclassified."
},
{
"id": 51,
"questionText": "Scenario: DBSCAN applied to customer segmentation with varying buying density. Issue?",
"options": [
"Noise eliminated automatically",
"Clusters merged randomly",
"All clusters detected perfectly",
"Some smaller or sparser clusters may be missed"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN’s global eps struggles with clusters of different densities; adaptive methods recommended."
},
{
"id": 52,
"questionText": "Scenario: You want DBSCAN to detect small anomalies in large dataset. How to adjust?",
"options": [
"Increase eps arbitrarily",
"Decrease minPts and eps appropriately",
"Ignore small clusters",
"Use K-Means instead"
],
"correctAnswerIndex": 1,
"explanation": "Smaller minPts and eps allow DBSCAN to detect small dense regions representing anomalies."
},
{
"id": 53,
"questionText": "Scenario: Using DBSCAN for clustering Wi-Fi signals in a building. Advantage?",
"options": [
"Identifies dense signal regions and ignores noise",
"All points assigned to clusters",
"Requires number of clusters",
"Clusters must be circular"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN can detect regions with strong signal density and label isolated weak signals as noise."
},
{
"id": 54,
"questionText": "Scenario: DBSCAN on image pixel intensities for segmentation. Outcome?",
"options": [
"Requires predefined cluster number",
"Clusters must be circular",
"All pixels assigned",
"Arbitrary-shaped regions segmented; noise isolated"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN can segment regions of any shape and label scattered pixels as noise."
},
{
"id": 55,
"questionText": "Scenario: Using DBSCAN on 3D point cloud of a city. Advantage?",
"options": [
"Detects clusters like buildings, trees, and separates sparse points",
"Noise merged into clusters",
"All points assigned",
"Clusters must be spherical"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN works in multi-dimensional data and identifies meaningful dense clusters."
},
{
"id": 56,
"questionText": "Scenario: DBSCAN fails with high-dimensional word embeddings. Solution?",
"options": [
"Apply dimensionality reduction before clustering",
"Use K-Means",
"Increase eps globally",
"Ignore problem"
],
"correctAnswerIndex": 0,
"explanation": "High-dimensional spaces make distance less meaningful; reduction helps clustering performance."
},
{
"id": 57,
"questionText": "Scenario: Border points connected to multiple core points. Assignment?",
"options": [
"Assigned to one cluster reachable first",
"Algorithm fails",
"Assigned to all clusters simultaneously",
"Become noise"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN assigns border points to a single cluster; typically the first reachable core point."
},
{
"id": 58,
"questionText": "Scenario: DBSCAN on streaming data. Limitation?",
"options": [
"Noise ignored",
"Automatically updates clusters",
"All points reassigned automatically",
"Standard DBSCAN cannot update incrementally; adaptation needed"
],
"correctAnswerIndex": 3,
"explanation": "Incremental or streaming adaptations of DBSCAN are required for dynamic datasets."
},
{
"id": 59,
"questionText": "Scenario: Clusters are elongated and dense. DBSCAN vs K-Means?",
"options": [
"Both fail",
"K-Means better",
"All points assigned to noise",
"DBSCAN captures shape; K-Means fails with elongated clusters"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN’s density-based approach handles arbitrary shapes like elongated clusters well."
},
{
"id": 60,
"questionText": "Scenario: Choosing minPts parameter. Rule of thumb?",
"options": [
"minPts = dataset size",
"minPts ≥ dimensionality + 1",
"minPts = 1 always",
"minPts ignored"
],
"correctAnswerIndex": 1,
"explanation": "Choosing minPts slightly larger than data dimensionality ensures meaningful cluster formation."
},
{
"id": 61,
"questionText": "Scenario: DBSCAN applied to weather station locations. Advantage?",
"options": [
"All stations assigned",
"Noise merged into clusters",
"Detects dense station clusters and separates isolated stations as noise",
"Clusters must be circular"
],
"correctAnswerIndex": 2,
"explanation": "DBSCAN can find groups of stations in dense regions while labeling isolated ones as noise."
},
{
"id": 62,
"questionText": "Scenario: DBSCAN applied to vehicle GPS tracks. Best outcome?",
"options": [
"All vehicles assigned to same cluster",
"Requires predefined cluster number",
"Clusters must be circular",
"Detect hotspots of vehicle activity and identify sparse routes"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN identifies dense routes or locations and marks sparse movements as noise."
},
{
"id": 63,
"questionText": "Scenario: DBSCAN applied to detect fraudulent transactions. Advantage?",
"options": [
"All transactions clustered",
"Isolates unusual low-density transactions as potential fraud",
"Clusters merged arbitrarily",
"Noise ignored"
],
"correctAnswerIndex": 1,
"explanation": "Low-density points are flagged naturally, useful for anomaly detection in finance."
},
{
"id": 64,
"questionText": "Scenario: eps too large. Effect on clusters?",
"options": [
"Clusters may merge; noise reduced",
"Noise increases",
"More clusters detected",
"Algorithm fails"
],
"correctAnswerIndex": 0,
"explanation": "Large eps connects distant points, merging separate clusters and reducing noise."
},
{
"id": 65,
"questionText": "Scenario: eps too small. Effect on clusters?",
"options": [
"Clusters merge",
"Noise decreases",
"Many points labeled as noise; clusters fragmented",
"Algorithm fails"
],
"correctAnswerIndex": 2,
"explanation": "Small eps prevents points from forming dense clusters; many become noise."
},
{
"id": 66,
"questionText": "Scenario: High-dimensional clustering. DBSCAN limitation?",
"options": [
"Clusters detected perfectly",
"All points assigned",
"Distances lose meaning; density estimation difficult",
"Noise ignored"
],
"correctAnswerIndex": 2,
"explanation": "High dimensions make points appear equidistant, complicating density-based clustering."
},
{
"id": 67,
"questionText": "Scenario: Data with multiple density clusters. Solution?",
"options": [
"Use HDBSCAN for adaptive density clustering",
"Increase eps globally",
"Reduce minPts to 1",
"Ignore problem"
],
"correctAnswerIndex": 0,
"explanation": "HDBSCAN adapts to varying densities, unlike standard DBSCAN."
},
{
"id": 68,
"questionText": "Scenario: Using DBSCAN on customer browsing patterns. Advantage?",
"options": [
"Noise ignored",
"Requires predefined cluster number",
"All points assigned",
"Detects dense behavioral patterns and isolates outliers"
],
"correctAnswerIndex": 3,
"explanation": "Dense browsing behaviors form clusters; rare patterns become noise."
},
{
"id": 69,
"questionText": "Scenario: Noise points in DBSCAN. Definition?",
"options": [
"Cluster centroids",
"All points in clusters",
"Points not reachable from any core point",
"Points with minPts neighbors"
],
"correctAnswerIndex": 2,
"explanation": "Noise points are isolated points not part of any cluster."
},
{
"id": 70,
"questionText": "Scenario: Choosing distance metric in DBSCAN. Effect?",
"options": [
"Affects neighborhood definition and cluster shape",
"Noise ignored",
"No effect",
"All points merged"
],
"correctAnswerIndex": 0,
"explanation": "The distance metric changes how neighbors are counted, affecting cluster formation."
},
{
"id": 71,
"questionText": "Scenario: DBSCAN applied to earthquake epicenters. Advantage?",
"options": [
"Clusters must be circular",
"Detects clusters of seismic activity and isolates isolated events",
"Noise merged into clusters",
"All events assigned"
],
"correctAnswerIndex": 1,
"explanation": "DBSCAN identifies dense seismic regions and separates rare events as noise."
},
{
"id": 72,
"questionText": "Scenario: Varying eps across dataset. How to achieve?",
"options": [
"Ignore variation",
"Random eps each run",
"Use adaptive DBSCAN variants like HDBSCAN",
"Standard DBSCAN suffices"
],
"correctAnswerIndex": 2,
"explanation": "Adaptive algorithms adjust density thresholds to handle varying densities."
},
{
"id": 73,
"questionText": "Scenario: Applying DBSCAN on medical imaging. Benefit?",
"options": [
"Clusters must be spherical",
"Requires fixed cluster number",
"Detects regions of interest and separates background noise",
"All pixels clustered"
],
"correctAnswerIndex": 2,
"explanation": "DBSCAN segments irregular shapes and isolates sparse/noisy regions."
},
{
"id": 74,
"questionText": "Scenario: Using DBSCAN for anomaly detection in IoT sensors. Approach?",
"options": [
"Ignore isolated readings",
"Label low-density readings as anomalies",
"Cluster all points",
"Random assignment"
],
"correctAnswerIndex": 1,
"explanation": "Isolated readings or sparse patterns naturally become noise, indicating anomalies."
},
{
"id": 75,
"questionText": "Scenario: DBSCAN on financial transactions. Noise points indicate?",
"options": [
"Noise merged",
"All transactions are legitimate",
"Potential fraudulent or unusual transactions",
"Clusters merged"
],
"correctAnswerIndex": 2,
"explanation": "Sparse points in dense transaction space are flagged as unusual or fraudulent."
},
{
"id": 76,
"questionText": "Scenario: DBSCAN applied to traffic accident locations. Advantage?",
"options": [
"Identifies accident hotspots and isolates rare events",
"All accidents assigned",
"Noise merged into clusters",
"Clusters must be circular"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN finds dense accident regions and treats isolated incidents as noise."
},
{
"id": 77,
"questionText": "Scenario: eps and minPts selection using k-distance plot. What is the elbow point?",
"options": [
"Minimum distance",
"Random point",
"Point where distance sharply increases, suitable for eps",
"Maximum distance"
],
"correctAnswerIndex": 2,
"explanation": "The elbow in the k-distance graph indicates the transition from dense to sparse regions, guiding eps selection."
},
{
"id": 78,
"questionText": "Scenario: Border points connected to multiple clusters. Assignment in DBSCAN?",
"options": [
"Assigned to all clusters",
"Become noise",
"Assigned to the first reachable cluster",
"Clusters merge automatically"
],
"correctAnswerIndex": 2,
"explanation": "Border points are assigned to one cluster, typically the first one that reaches them."
},
{
"id": 79,
"questionText": "Scenario: DBSCAN on social media check-ins. Benefit?",
"options": [
"Clusters must be predefined",
"All users assigned",
"Noise ignored",
"Detects popular locations and identifies sparse users"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN identifies dense activity areas and treats isolated check-ins as noise."
},
{
"id": 80,
"questionText": "Scenario: Standard DBSCAN fails on variable density data. Solution?",
"options": [
"Ignore the problem",
"Increase eps globally",
"Decrease minPts arbitrarily",
"Use HDBSCAN for hierarchical density-based clustering"
],
"correctAnswerIndex": 3,
"explanation": "HDBSCAN adapts to varying density, unlike standard DBSCAN."
},
{
"id": 81,
"questionText": "Scenario: DBSCAN on genomic data. Advantage?",
"options": [
"Clusters must be circular",
"All genes assigned",
"Identifies dense gene clusters and isolates rare genes",
"Noise merged"
],
"correctAnswerIndex": 2,
"explanation": "DBSCAN can identify dense gene expression patterns and separate sparse or rare genes as noise."
},
{
"id": 82,
"questionText": "Scenario: Choosing minPts too high. Effect?",
"options": [
"Algorithm fails",
"Clusters merge",
"Small clusters ignored; many points labeled noise",
"More clusters detected"
],
"correctAnswerIndex": 2,
"explanation": "High minPts requires dense regions; sparse or small clusters are lost."
},
{
"id": 83,
"questionText": "Scenario: Choosing minPts too low. Effect?",
"options": [
"Many small clusters formed; noise reduced",
"Clusters merge",
"Algorithm fails",
"All points noise"
],
"correctAnswerIndex": 0,
"explanation": "Low minPts allows small groups to form clusters, potentially splitting natural clusters."
},
{
"id": 84,
"questionText": "Scenario: DBSCAN applied on customer location data. Advantage?",
"options": [
"Requires predefined cluster count",
"All points assigned",
"Clusters must be circular",
"Identifies dense shopping areas and isolates isolated customers"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN captures dense shopping locations and labels scattered customers as noise."
},
{
"id": 85,
"questionText": "Scenario: High-dimensional text embeddings. DBSCAN limitation?",
"options": [
"Distances lose meaning; clusters may be unreliable",
"Algorithm faster",
"Noise ignored",
"Clusters always detected"
],
"correctAnswerIndex": 0,
"explanation": "In high dimensions, distances are less discriminative, affecting density and clustering."
},
{
"id": 86,
"questionText": "Scenario: Using DBSCAN on image feature vectors. Benefit?",
"options": [
"Requires predefined cluster count",
"All features assigned",
"Groups similar image features and isolates outliers",
"Clusters must be circular"
],
"correctAnswerIndex": 2,
"explanation": "DBSCAN detects dense feature groups and treats isolated features as noise."
},
{
"id": 87,
"questionText": "Scenario: eps too small. Effect?",
"options": [
"Clusters fragmented; many points labeled noise",
"Clusters merge",
"All points assigned",
"Algorithm fails"
],
"correctAnswerIndex": 0,
"explanation": "Small eps prevents formation of dense clusters; isolated points become noise."
},
{
"id": 88,
"questionText": "Scenario: eps too large. Effect?",
"options": [
"More clusters detected",
"Algorithm fails",
"Clusters merge; fewer noise points",
"Noise increases"
],
"correctAnswerIndex": 2,
"explanation": "Large eps connects distant points, merging separate clusters and reducing noise."
},
{
"id": 89,
"questionText": "Scenario: DBSCAN on irregularly shaped 2D clusters. Advantage?",
"options": [
"Clusters must be circular",
"Captures arbitrary shapes unlike K-Means",
"All points assigned",
"Noise ignored"
],
"correctAnswerIndex": 1,
"explanation": "DBSCAN does not assume cluster shape, so it captures elongated or irregular clusters."
},
{
"id": 90,
"questionText": "Scenario: Border point connected to multiple core points. Assignment?",
"options": [
"Assigned to first reachable cluster",
"Assigned to all clusters",
"Clusters merge",
"Becomes noise"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN assigns a border point to one cluster, typically the first core point that reaches it."
},
{
"id": 91,
"questionText": "Scenario: DBSCAN on IoT sensor anomaly detection. Advantage?",
"options": [
"Sparse readings flagged as anomalies automatically",
"Noise ignored",
"All readings clustered",
"Clusters merged arbitrarily"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN labels low-density points as noise, which is useful for detecting anomalies."
},
{
"id": 92,
"questionText": "Scenario: DBSCAN with streaming data. Limitation?",
"options": [
"Needs adaptation; standard DBSCAN is static",
"Noise ignored",
"Automatically updates clusters",
"All points reassigned automatically"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN is not incremental; streaming or dynamic data requires modified algorithms."
},
{
"id": 93,
"questionText": "Scenario: Using DBSCAN on earthquake data. Benefit?",
"options": [
"Detects dense seismic zones; isolates rare events",
"All events clustered",
"Noise merged",
"Clusters must be circular"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN identifies dense clusters of earthquakes and labels isolated events as noise."
},
{
"id": 94,
"questionText": "Scenario: Noise in DBSCAN definition?",
"options": [
"Cluster centroids",
"Points not reachable from any core point",
"Points with minPts neighbors",
"All points assigned"
],
"correctAnswerIndex": 1,
"explanation": "Noise points are isolated points not part of any cluster."
},
{
"id": 95,
"questionText": "Scenario: Varying density clusters. Best DBSCAN variant?",
"options": [
"Standard DBSCAN",
"K-Means",
"HDBSCAN",
"Agglomerative clustering"
],
"correctAnswerIndex": 2,
"explanation": "HDBSCAN adapts to different densities and creates a hierarchy of clusters."
},
{
"id": 96,
"questionText": "Scenario: Choosing eps using k-distance plot. How?",
"options": [
"Select maximum distance",
"Select value at elbow point where distances sharply rise",
"Randomly select eps",
"Select minimum distance"
],
"correctAnswerIndex": 1,
"explanation": "The elbow point indicates the transition from dense to sparse points, guiding eps choice."
},
{
"id": 97,
"questionText": "Scenario: DBSCAN on customer behavior patterns. Benefit?",
"options": [
"Groups dense behavior patterns; isolates rare customers",
"Requires fixed number of clusters",
"Noise ignored",
"All points assigned"
],
"correctAnswerIndex": 0,
"explanation": "DBSCAN identifies dense behavioral clusters and labels rare behaviors as noise."
},
{
"id": 98,
"questionText": "Scenario: DBSCAN vs K-Means for non-spherical clusters. Advantage?",
"options": [
"K-Means better",
"Noise ignored",
"Both fail",
"DBSCAN captures arbitrary shapes"
],
"correctAnswerIndex": 3,
"explanation": "DBSCAN does not assume cluster shape and handles irregular or elongated clusters."
},
{
"id": 99,
"questionText": "Scenario: High-dimensional DBSCAN problem. Solution?",
"options": [
"Dimensionality reduction (PCA, t-SNE) or HDBSCAN",
"Increase minPts arbitrarily",
"Ignore scaling",
"Use raw distances"
],
"correctAnswerIndex": 0,
"explanation": "High-dimensional spaces make distances less meaningful; reduction or adaptive methods improve clustering."
},
{
"id": 100,
"questionText": "Scenario: Choosing minPts in DBSCAN. Rule of thumb?",
"options": [
"minPts = 1 always",
"minPts = dataset size",
"Ignore minPts",
"minPts ≥ dimensionality + 1"
],
"correctAnswerIndex": 3,
"explanation": "minPts should slightly exceed data dimensionality to ensure meaningful clusters."
}
]
}